xref: /petsc/src/mat/impls/nest/matnest.c (revision 28b400f66ebc7ae0049166a2294dfcd3df27e64b)
1aaa7dc30SBarry Smith #include <../src/mat/impls/nest/matnestimpl.h> /*I   "petscmat.h"   I*/
2b68353e5Sstefano_zampini #include <../src/mat/impls/aij/seq/aij.h>
30c312b8eSJed Brown #include <petscsf.h>
4d8588912SDave May 
5c8883902SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat,PetscInt,const IS[],PetscInt,const IS[]);
606a1af2fSStefano Zampini static PetscErrorCode MatCreateVecs_Nest(Mat,Vec*,Vec*);
706a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat);
806a1af2fSStefano Zampini 
95e3038f0Sstefano_zampini PETSC_INTERN PetscErrorCode MatConvert_Nest_IS(Mat,MatType,MatReuse,Mat*);
10c8883902SJed Brown 
11d8588912SDave May /* private functions */
128188e55aSJed Brown static PetscErrorCode MatNestGetSizes_Private(Mat A,PetscInt *m,PetscInt *n,PetscInt *M,PetscInt *N)
13d8588912SDave May {
14d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
158188e55aSJed Brown   PetscInt       i,j;
16d8588912SDave May 
17d8588912SDave May   PetscFunctionBegin;
188188e55aSJed Brown   *m = *n = *M = *N = 0;
198188e55aSJed Brown   for (i=0; i<bA->nr; i++) {  /* rows */
208188e55aSJed Brown     PetscInt sm,sM;
215f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetLocalSize(bA->isglobal.row[i],&sm));
225f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetSize(bA->isglobal.row[i],&sM));
238188e55aSJed Brown     *m  += sm;
248188e55aSJed Brown     *M  += sM;
25d8588912SDave May   }
268188e55aSJed Brown   for (j=0; j<bA->nc; j++) {  /* cols */
278188e55aSJed Brown     PetscInt sn,sN;
285f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetLocalSize(bA->isglobal.col[j],&sn));
295f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetSize(bA->isglobal.col[j],&sN));
308188e55aSJed Brown     *n  += sn;
318188e55aSJed Brown     *N  += sN;
32d8588912SDave May   }
33d8588912SDave May   PetscFunctionReturn(0);
34d8588912SDave May }
35d8588912SDave May 
36d8588912SDave May /* operations */
37207556f9SJed Brown static PetscErrorCode MatMult_Nest(Mat A,Vec x,Vec y)
38d8588912SDave May {
39d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
40207556f9SJed Brown   Vec            *bx = bA->right,*by = bA->left;
41207556f9SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
42d8588912SDave May 
43d8588912SDave May   PetscFunctionBegin;
445f80ce2aSJacob Faibussowitsch   for (i=0; i<nr; i++) CHKERRQ(VecGetSubVector(y,bA->isglobal.row[i],&by[i]));
455f80ce2aSJacob Faibussowitsch   for (i=0; i<nc; i++) CHKERRQ(VecGetSubVector(x,bA->isglobal.col[i],&bx[i]));
46207556f9SJed Brown   for (i=0; i<nr; i++) {
475f80ce2aSJacob Faibussowitsch     CHKERRQ(VecZeroEntries(by[i]));
48207556f9SJed Brown     for (j=0; j<nc; j++) {
49207556f9SJed Brown       if (!bA->m[i][j]) continue;
50d8588912SDave May       /* y[i] <- y[i] + A[i][j] * x[j] */
515f80ce2aSJacob Faibussowitsch       CHKERRQ(MatMultAdd(bA->m[i][j],bx[j],by[i],by[i]));
52d8588912SDave May     }
53d8588912SDave May   }
545f80ce2aSJacob Faibussowitsch   for (i=0; i<nr; i++) CHKERRQ(VecRestoreSubVector(y,bA->isglobal.row[i],&by[i]));
555f80ce2aSJacob Faibussowitsch   for (i=0; i<nc; i++) CHKERRQ(VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]));
56d8588912SDave May   PetscFunctionReturn(0);
57d8588912SDave May }
58d8588912SDave May 
599194d70fSJed Brown static PetscErrorCode MatMultAdd_Nest(Mat A,Vec x,Vec y,Vec z)
609194d70fSJed Brown {
619194d70fSJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
629194d70fSJed Brown   Vec            *bx = bA->right,*bz = bA->left;
639194d70fSJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
649194d70fSJed Brown 
659194d70fSJed Brown   PetscFunctionBegin;
665f80ce2aSJacob Faibussowitsch   for (i=0; i<nr; i++) CHKERRQ(VecGetSubVector(z,bA->isglobal.row[i],&bz[i]));
675f80ce2aSJacob Faibussowitsch   for (i=0; i<nc; i++) CHKERRQ(VecGetSubVector(x,bA->isglobal.col[i],&bx[i]));
689194d70fSJed Brown   for (i=0; i<nr; i++) {
699194d70fSJed Brown     if (y != z) {
709194d70fSJed Brown       Vec by;
715f80ce2aSJacob Faibussowitsch       CHKERRQ(VecGetSubVector(y,bA->isglobal.row[i],&by));
725f80ce2aSJacob Faibussowitsch       CHKERRQ(VecCopy(by,bz[i]));
735f80ce2aSJacob Faibussowitsch       CHKERRQ(VecRestoreSubVector(y,bA->isglobal.row[i],&by));
749194d70fSJed Brown     }
759194d70fSJed Brown     for (j=0; j<nc; j++) {
769194d70fSJed Brown       if (!bA->m[i][j]) continue;
779194d70fSJed Brown       /* y[i] <- y[i] + A[i][j] * x[j] */
785f80ce2aSJacob Faibussowitsch       CHKERRQ(MatMultAdd(bA->m[i][j],bx[j],bz[i],bz[i]));
799194d70fSJed Brown     }
809194d70fSJed Brown   }
815f80ce2aSJacob Faibussowitsch   for (i=0; i<nr; i++) CHKERRQ(VecRestoreSubVector(z,bA->isglobal.row[i],&bz[i]));
825f80ce2aSJacob Faibussowitsch   for (i=0; i<nc; i++) CHKERRQ(VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]));
839194d70fSJed Brown   PetscFunctionReturn(0);
849194d70fSJed Brown }
859194d70fSJed Brown 
8652c5f739Sprj- typedef struct {
8752c5f739Sprj-   Mat          *workC;    /* array of Mat with specific containers depending on the underlying MatMatMult implementation */
8852c5f739Sprj-   PetscScalar  *tarray;   /* buffer for storing all temporary products A[i][j] B[j] */
8952c5f739Sprj-   PetscInt     *dm,*dn,k; /* displacements and number of submatrices */
9052c5f739Sprj- } Nest_Dense;
9152c5f739Sprj- 
926718818eSStefano Zampini PETSC_INTERN PetscErrorCode MatProductNumeric_Nest_Dense(Mat C)
9352c5f739Sprj- {
946718818eSStefano Zampini   Mat_Nest          *bA;
9552c5f739Sprj-   Nest_Dense        *contents;
966718818eSStefano Zampini   Mat               viewB,viewC,productB,workC;
9752c5f739Sprj-   const PetscScalar *barray;
9852c5f739Sprj-   PetscScalar       *carray;
996718818eSStefano Zampini   PetscInt          i,j,M,N,nr,nc,ldb,ldc;
1006718818eSStefano Zampini   Mat               A,B;
10152c5f739Sprj- 
10252c5f739Sprj-   PetscFunctionBegin;
1036718818eSStefano Zampini   MatCheckProduct(C,3);
1046718818eSStefano Zampini   A    = C->product->A;
1056718818eSStefano Zampini   B    = C->product->B;
1065f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetSize(B,NULL,&N));
1076718818eSStefano Zampini   if (!N) {
1085f80ce2aSJacob Faibussowitsch     CHKERRQ(MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY));
1095f80ce2aSJacob Faibussowitsch     CHKERRQ(MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY));
1106718818eSStefano Zampini     PetscFunctionReturn(0);
1116718818eSStefano Zampini   }
1126718818eSStefano Zampini   contents = (Nest_Dense*)C->product->data;
113*28b400f6SJacob Faibussowitsch   PetscCheck(contents,PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Product data empty");
1146718818eSStefano Zampini   bA   = (Mat_Nest*)A->data;
1156718818eSStefano Zampini   nr   = bA->nr;
1166718818eSStefano Zampini   nc   = bA->nc;
1175f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDenseGetLDA(B,&ldb));
1185f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDenseGetLDA(C,&ldc));
1195f80ce2aSJacob Faibussowitsch   CHKERRQ(MatZeroEntries(C));
1205f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDenseGetArrayRead(B,&barray));
1215f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDenseGetArray(C,&carray));
12252c5f739Sprj-   for (i=0; i<nr; i++) {
1235f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetSize(bA->isglobal.row[i],&M));
1245f80ce2aSJacob Faibussowitsch     CHKERRQ(MatCreateDense(PetscObjectComm((PetscObject)A),contents->dm[i+1]-contents->dm[i],PETSC_DECIDE,M,N,carray+contents->dm[i],&viewC));
1255f80ce2aSJacob Faibussowitsch     CHKERRQ(MatDenseSetLDA(viewC,ldc));
12652c5f739Sprj-     for (j=0; j<nc; j++) {
12752c5f739Sprj-       if (!bA->m[i][j]) continue;
1285f80ce2aSJacob Faibussowitsch       CHKERRQ(ISGetSize(bA->isglobal.col[j],&M));
1295f80ce2aSJacob Faibussowitsch       CHKERRQ(MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB));
1305f80ce2aSJacob Faibussowitsch       CHKERRQ(MatDenseSetLDA(viewB,ldb));
1314222ddf1SHong Zhang 
1324222ddf1SHong Zhang       /* MatMatMultNumeric(bA->m[i][j],viewB,contents->workC[i*nc + j]); */
1334222ddf1SHong Zhang       workC             = contents->workC[i*nc + j];
1344222ddf1SHong Zhang       productB          = workC->product->B;
1354222ddf1SHong Zhang       workC->product->B = viewB; /* use newly created dense matrix viewB */
1365f80ce2aSJacob Faibussowitsch       CHKERRQ(MatProductNumeric(workC));
1375f80ce2aSJacob Faibussowitsch       CHKERRQ(MatDestroy(&viewB));
1384222ddf1SHong Zhang       workC->product->B = productB; /* resume original B */
1394222ddf1SHong Zhang 
14052c5f739Sprj-       /* C[i] <- workC + C[i] */
1415f80ce2aSJacob Faibussowitsch       CHKERRQ(MatAXPY(viewC,1.0,contents->workC[i*nc + j],SAME_NONZERO_PATTERN));
14252c5f739Sprj-     }
1435f80ce2aSJacob Faibussowitsch     CHKERRQ(MatDestroy(&viewC));
14452c5f739Sprj-   }
1455f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDenseRestoreArray(C,&carray));
1465f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDenseRestoreArrayRead(B,&barray));
1474222ddf1SHong Zhang 
1485f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY));
1495f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY));
15052c5f739Sprj-   PetscFunctionReturn(0);
15152c5f739Sprj- }
15252c5f739Sprj- 
15352c5f739Sprj- PetscErrorCode MatNest_DenseDestroy(void *ctx)
15452c5f739Sprj- {
15552c5f739Sprj-   Nest_Dense     *contents = (Nest_Dense*)ctx;
15652c5f739Sprj-   PetscInt       i;
15752c5f739Sprj- 
15852c5f739Sprj-   PetscFunctionBegin;
1595f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree(contents->tarray));
16052c5f739Sprj-   for (i=0; i<contents->k; i++) {
1615f80ce2aSJacob Faibussowitsch     CHKERRQ(MatDestroy(contents->workC + i));
16252c5f739Sprj-   }
1635f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree3(contents->dm,contents->dn,contents->workC));
1645f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree(contents));
16552c5f739Sprj-   PetscFunctionReturn(0);
16652c5f739Sprj- }
16752c5f739Sprj- 
1686718818eSStefano Zampini PETSC_INTERN PetscErrorCode MatProductSymbolic_Nest_Dense(Mat C)
16952c5f739Sprj- {
1706718818eSStefano Zampini   Mat_Nest          *bA;
1716718818eSStefano Zampini   Mat               viewB,workC;
17252c5f739Sprj-   const PetscScalar *barray;
1736718818eSStefano Zampini   PetscInt          i,j,M,N,m,n,nr,nc,maxm = 0,ldb;
1744222ddf1SHong Zhang   Nest_Dense        *contents=NULL;
1756718818eSStefano Zampini   PetscBool         cisdense;
1766718818eSStefano Zampini   Mat               A,B;
1776718818eSStefano Zampini   PetscReal         fill;
17852c5f739Sprj- 
17952c5f739Sprj-   PetscFunctionBegin;
1806718818eSStefano Zampini   MatCheckProduct(C,4);
181*28b400f6SJacob Faibussowitsch   PetscCheck(!C->product->data,PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Product data not empty");
1826718818eSStefano Zampini   A    = C->product->A;
1836718818eSStefano Zampini   B    = C->product->B;
1846718818eSStefano Zampini   fill = C->product->fill;
1856718818eSStefano Zampini   bA   = (Mat_Nest*)A->data;
1866718818eSStefano Zampini   nr   = bA->nr;
1876718818eSStefano Zampini   nc   = bA->nc;
1885f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetLocalSize(C,&m,&n));
1895f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetSize(C,&M,&N));
1900572eedcSPierre Jolivet   if (m == PETSC_DECIDE || n == PETSC_DECIDE || M == PETSC_DECIDE || N == PETSC_DECIDE) {
1915f80ce2aSJacob Faibussowitsch     CHKERRQ(MatGetLocalSize(B,NULL,&n));
1925f80ce2aSJacob Faibussowitsch     CHKERRQ(MatGetSize(B,NULL,&N));
1935f80ce2aSJacob Faibussowitsch     CHKERRQ(MatGetLocalSize(A,&m,NULL));
1945f80ce2aSJacob Faibussowitsch     CHKERRQ(MatGetSize(A,&M,NULL));
1955f80ce2aSJacob Faibussowitsch     CHKERRQ(MatSetSizes(C,m,n,M,N));
1960572eedcSPierre Jolivet   }
1975f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATMPIDENSE,MATSEQDENSECUDA,MATMPIDENSECUDA,""));
1986718818eSStefano Zampini   if (!cisdense) {
1995f80ce2aSJacob Faibussowitsch     CHKERRQ(MatSetType(C,((PetscObject)B)->type_name));
2006718818eSStefano Zampini   }
2015f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSetUp(C));
2026718818eSStefano Zampini   if (!N) {
2036718818eSStefano Zampini     C->ops->productnumeric = MatProductNumeric_Nest_Dense;
2046718818eSStefano Zampini     PetscFunctionReturn(0);
20552c5f739Sprj-   }
20652c5f739Sprj- 
2075f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscNew(&contents));
2086718818eSStefano Zampini   C->product->data = contents;
2096718818eSStefano Zampini   C->product->destroy = MatNest_DenseDestroy;
2105f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscCalloc3(nr+1,&contents->dm,nc+1,&contents->dn,nr*nc,&contents->workC));
21152c5f739Sprj-   contents->k = nr*nc;
21252c5f739Sprj-   for (i=0; i<nr; i++) {
2135f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetLocalSize(bA->isglobal.row[i],contents->dm + i+1));
21452c5f739Sprj-     maxm = PetscMax(maxm,contents->dm[i+1]);
21552c5f739Sprj-     contents->dm[i+1] += contents->dm[i];
21652c5f739Sprj-   }
21752c5f739Sprj-   for (i=0; i<nc; i++) {
2185f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetLocalSize(bA->isglobal.col[i],contents->dn + i+1));
21952c5f739Sprj-     contents->dn[i+1] += contents->dn[i];
22052c5f739Sprj-   }
2215f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMalloc1(maxm*N,&contents->tarray));
2225f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDenseGetLDA(B,&ldb));
2235f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetSize(B,NULL,&N));
2245f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDenseGetArrayRead(B,&barray));
22552c5f739Sprj-   /* loops are permuted compared to MatMatMultNumeric so that viewB is created only once per column of A */
22652c5f739Sprj-   for (j=0; j<nc; j++) {
2275f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetSize(bA->isglobal.col[j],&M));
2285f80ce2aSJacob Faibussowitsch     CHKERRQ(MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB));
2295f80ce2aSJacob Faibussowitsch     CHKERRQ(MatDenseSetLDA(viewB,ldb));
23052c5f739Sprj-     for (i=0; i<nr; i++) {
23152c5f739Sprj-       if (!bA->m[i][j]) continue;
23252c5f739Sprj-       /* MatMatMultSymbolic may attach a specific container (depending on MatType of bA->m[i][j]) to workC[i][j] */
2334222ddf1SHong Zhang 
2345f80ce2aSJacob Faibussowitsch       CHKERRQ(MatProductCreate(bA->m[i][j],viewB,NULL,&contents->workC[i*nc + j]));
2354222ddf1SHong Zhang       workC = contents->workC[i*nc + j];
2365f80ce2aSJacob Faibussowitsch       CHKERRQ(MatProductSetType(workC,MATPRODUCT_AB));
2375f80ce2aSJacob Faibussowitsch       CHKERRQ(MatProductSetAlgorithm(workC,"default"));
2385f80ce2aSJacob Faibussowitsch       CHKERRQ(MatProductSetFill(workC,fill));
2395f80ce2aSJacob Faibussowitsch       CHKERRQ(MatProductSetFromOptions(workC));
2405f80ce2aSJacob Faibussowitsch       CHKERRQ(MatProductSymbolic(workC));
2414222ddf1SHong Zhang 
2426718818eSStefano Zampini       /* since tarray will be shared by all Mat */
2435f80ce2aSJacob Faibussowitsch       CHKERRQ(MatSeqDenseSetPreallocation(workC,contents->tarray));
2445f80ce2aSJacob Faibussowitsch       CHKERRQ(MatMPIDenseSetPreallocation(workC,contents->tarray));
24552c5f739Sprj-     }
2465f80ce2aSJacob Faibussowitsch     CHKERRQ(MatDestroy(&viewB));
24752c5f739Sprj-   }
2485f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDenseRestoreArrayRead(B,&barray));
24952c5f739Sprj- 
2506718818eSStefano Zampini   C->ops->productnumeric = MatProductNumeric_Nest_Dense;
25152c5f739Sprj-   PetscFunctionReturn(0);
25252c5f739Sprj- }
25352c5f739Sprj- 
2544222ddf1SHong Zhang /* --------------------------------------------------------- */
2554222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_Nest_Dense_AB(Mat C)
2564222ddf1SHong Zhang {
2574222ddf1SHong Zhang   PetscFunctionBegin;
2586718818eSStefano Zampini   C->ops->productsymbolic = MatProductSymbolic_Nest_Dense;
2594222ddf1SHong Zhang   PetscFunctionReturn(0);
2604222ddf1SHong Zhang }
2614222ddf1SHong Zhang 
2624222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_Nest_Dense(Mat C)
26352c5f739Sprj- {
2644222ddf1SHong Zhang   Mat_Product    *product = C->product;
26552c5f739Sprj- 
26652c5f739Sprj-   PetscFunctionBegin;
2674222ddf1SHong Zhang   if (product->type == MATPRODUCT_AB) {
2685f80ce2aSJacob Faibussowitsch     CHKERRQ(MatProductSetFromOptions_Nest_Dense_AB(C));
2696718818eSStefano Zampini   }
27052c5f739Sprj-   PetscFunctionReturn(0);
27152c5f739Sprj- }
2724222ddf1SHong Zhang /* --------------------------------------------------------- */
27352c5f739Sprj- 
274207556f9SJed Brown static PetscErrorCode MatMultTranspose_Nest(Mat A,Vec x,Vec y)
275d8588912SDave May {
276d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
277207556f9SJed Brown   Vec            *bx = bA->left,*by = bA->right;
278207556f9SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
279d8588912SDave May 
280d8588912SDave May   PetscFunctionBegin;
2815f80ce2aSJacob Faibussowitsch   for (i=0; i<nr; i++) CHKERRQ(VecGetSubVector(x,bA->isglobal.row[i],&bx[i]));
2825f80ce2aSJacob Faibussowitsch   for (i=0; i<nc; i++) CHKERRQ(VecGetSubVector(y,bA->isglobal.col[i],&by[i]));
283207556f9SJed Brown   for (j=0; j<nc; j++) {
2845f80ce2aSJacob Faibussowitsch     CHKERRQ(VecZeroEntries(by[j]));
285609e31cbSJed Brown     for (i=0; i<nr; i++) {
2866c75ac25SJed Brown       if (!bA->m[i][j]) continue;
287609e31cbSJed Brown       /* y[j] <- y[j] + (A[i][j])^T * x[i] */
2885f80ce2aSJacob Faibussowitsch       CHKERRQ(MatMultTransposeAdd(bA->m[i][j],bx[i],by[j],by[j]));
289d8588912SDave May     }
290d8588912SDave May   }
2915f80ce2aSJacob Faibussowitsch   for (i=0; i<nr; i++) CHKERRQ(VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]));
2925f80ce2aSJacob Faibussowitsch   for (i=0; i<nc; i++) CHKERRQ(VecRestoreSubVector(y,bA->isglobal.col[i],&by[i]));
293d8588912SDave May   PetscFunctionReturn(0);
294d8588912SDave May }
295d8588912SDave May 
2969194d70fSJed Brown static PetscErrorCode MatMultTransposeAdd_Nest(Mat A,Vec x,Vec y,Vec z)
2979194d70fSJed Brown {
2989194d70fSJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
2999194d70fSJed Brown   Vec            *bx = bA->left,*bz = bA->right;
3009194d70fSJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
3019194d70fSJed Brown 
3029194d70fSJed Brown   PetscFunctionBegin;
3035f80ce2aSJacob Faibussowitsch   for (i=0; i<nr; i++) CHKERRQ(VecGetSubVector(x,bA->isglobal.row[i],&bx[i]));
3045f80ce2aSJacob Faibussowitsch   for (i=0; i<nc; i++) CHKERRQ(VecGetSubVector(z,bA->isglobal.col[i],&bz[i]));
3059194d70fSJed Brown   for (j=0; j<nc; j++) {
3069194d70fSJed Brown     if (y != z) {
3079194d70fSJed Brown       Vec by;
3085f80ce2aSJacob Faibussowitsch       CHKERRQ(VecGetSubVector(y,bA->isglobal.col[j],&by));
3095f80ce2aSJacob Faibussowitsch       CHKERRQ(VecCopy(by,bz[j]));
3105f80ce2aSJacob Faibussowitsch       CHKERRQ(VecRestoreSubVector(y,bA->isglobal.col[j],&by));
3119194d70fSJed Brown     }
3129194d70fSJed Brown     for (i=0; i<nr; i++) {
3136c75ac25SJed Brown       if (!bA->m[i][j]) continue;
3149194d70fSJed Brown       /* z[j] <- y[j] + (A[i][j])^T * x[i] */
3155f80ce2aSJacob Faibussowitsch       CHKERRQ(MatMultTransposeAdd(bA->m[i][j],bx[i],bz[j],bz[j]));
3169194d70fSJed Brown     }
3179194d70fSJed Brown   }
3185f80ce2aSJacob Faibussowitsch   for (i=0; i<nr; i++) CHKERRQ(VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]));
3195f80ce2aSJacob Faibussowitsch   for (i=0; i<nc; i++) CHKERRQ(VecRestoreSubVector(z,bA->isglobal.col[i],&bz[i]));
3209194d70fSJed Brown   PetscFunctionReturn(0);
3219194d70fSJed Brown }
3229194d70fSJed Brown 
323f8170845SAlex Fikl static PetscErrorCode MatTranspose_Nest(Mat A,MatReuse reuse,Mat *B)
324f8170845SAlex Fikl {
325f8170845SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data, *bC;
326f8170845SAlex Fikl   Mat            C;
327f8170845SAlex Fikl   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
328f8170845SAlex Fikl 
329f8170845SAlex Fikl   PetscFunctionBegin;
3302c71b3e2SJacob Faibussowitsch   PetscCheckFalse(reuse == MAT_INPLACE_MATRIX && nr != nc,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_SIZ,"Square nested matrix only for in-place");
331f8170845SAlex Fikl 
332cf37664fSBarry Smith   if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_INPLACE_MATRIX) {
333f8170845SAlex Fikl     Mat *subs;
334f8170845SAlex Fikl     IS  *is_row,*is_col;
335f8170845SAlex Fikl 
3365f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscCalloc1(nr * nc,&subs));
3375f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscMalloc2(nr,&is_row,nc,&is_col));
3385f80ce2aSJacob Faibussowitsch     CHKERRQ(MatNestGetISs(A,is_row,is_col));
339cf37664fSBarry Smith     if (reuse == MAT_INPLACE_MATRIX) {
340ddeb9bd8SAlex Fikl       for (i=0; i<nr; i++) {
341ddeb9bd8SAlex Fikl         for (j=0; j<nc; j++) {
342ddeb9bd8SAlex Fikl           subs[i + nr * j] = bA->m[i][j];
343ddeb9bd8SAlex Fikl         }
344ddeb9bd8SAlex Fikl       }
345ddeb9bd8SAlex Fikl     }
346ddeb9bd8SAlex Fikl 
3475f80ce2aSJacob Faibussowitsch     CHKERRQ(MatCreateNest(PetscObjectComm((PetscObject)A),nc,is_col,nr,is_row,subs,&C));
3485f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscFree(subs));
3495f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscFree2(is_row,is_col));
350f8170845SAlex Fikl   } else {
351f8170845SAlex Fikl     C = *B;
352f8170845SAlex Fikl   }
353f8170845SAlex Fikl 
354f8170845SAlex Fikl   bC = (Mat_Nest*)C->data;
355f8170845SAlex Fikl   for (i=0; i<nr; i++) {
356f8170845SAlex Fikl     for (j=0; j<nc; j++) {
357f8170845SAlex Fikl       if (bA->m[i][j]) {
3585f80ce2aSJacob Faibussowitsch         CHKERRQ(MatTranspose(bA->m[i][j], reuse, &(bC->m[j][i])));
359f8170845SAlex Fikl       } else {
360f8170845SAlex Fikl         bC->m[j][i] = NULL;
361f8170845SAlex Fikl       }
362f8170845SAlex Fikl     }
363f8170845SAlex Fikl   }
364f8170845SAlex Fikl 
365cf37664fSBarry Smith   if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) {
366f8170845SAlex Fikl     *B = C;
367f8170845SAlex Fikl   } else {
3685f80ce2aSJacob Faibussowitsch     CHKERRQ(MatHeaderMerge(A, &C));
369f8170845SAlex Fikl   }
370f8170845SAlex Fikl   PetscFunctionReturn(0);
371f8170845SAlex Fikl }
372f8170845SAlex Fikl 
373e2d7f03fSJed Brown static PetscErrorCode MatNestDestroyISList(PetscInt n,IS **list)
374e2d7f03fSJed Brown {
375e2d7f03fSJed Brown   IS             *lst = *list;
376e2d7f03fSJed Brown   PetscInt       i;
377e2d7f03fSJed Brown 
378e2d7f03fSJed Brown   PetscFunctionBegin;
379e2d7f03fSJed Brown   if (!lst) PetscFunctionReturn(0);
3805f80ce2aSJacob Faibussowitsch   for (i=0; i<n; i++) if (lst[i]) CHKERRQ(ISDestroy(&lst[i]));
3815f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree(lst));
3820298fd71SBarry Smith   *list = NULL;
383e2d7f03fSJed Brown   PetscFunctionReturn(0);
384e2d7f03fSJed Brown }
385e2d7f03fSJed Brown 
38606a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat A)
387d8588912SDave May {
388d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
389d8588912SDave May   PetscInt       i,j;
390d8588912SDave May 
391d8588912SDave May   PetscFunctionBegin;
392d8588912SDave May   /* release the matrices and the place holders */
3935f80ce2aSJacob Faibussowitsch   CHKERRQ(MatNestDestroyISList(vs->nr,&vs->isglobal.row));
3945f80ce2aSJacob Faibussowitsch   CHKERRQ(MatNestDestroyISList(vs->nc,&vs->isglobal.col));
3955f80ce2aSJacob Faibussowitsch   CHKERRQ(MatNestDestroyISList(vs->nr,&vs->islocal.row));
3965f80ce2aSJacob Faibussowitsch   CHKERRQ(MatNestDestroyISList(vs->nc,&vs->islocal.col));
397d8588912SDave May 
3985f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree(vs->row_len));
3995f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree(vs->col_len));
4005f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree(vs->nnzstate));
401d8588912SDave May 
4025f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree2(vs->left,vs->right));
403207556f9SJed Brown 
404d8588912SDave May   /* release the matrices and the place holders */
405d8588912SDave May   if (vs->m) {
406d8588912SDave May     for (i=0; i<vs->nr; i++) {
407d8588912SDave May       for (j=0; j<vs->nc; j++) {
4085f80ce2aSJacob Faibussowitsch         CHKERRQ(MatDestroy(&vs->m[i][j]));
409d8588912SDave May       }
4105f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscFree(vs->m[i]));
411d8588912SDave May     }
4125f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscFree(vs->m));
413d8588912SDave May   }
41406a1af2fSStefano Zampini 
41506a1af2fSStefano Zampini   /* restore defaults */
41606a1af2fSStefano Zampini   vs->nr = 0;
41706a1af2fSStefano Zampini   vs->nc = 0;
41806a1af2fSStefano Zampini   vs->splitassembly = PETSC_FALSE;
41906a1af2fSStefano Zampini   PetscFunctionReturn(0);
42006a1af2fSStefano Zampini }
42106a1af2fSStefano Zampini 
42206a1af2fSStefano Zampini static PetscErrorCode MatDestroy_Nest(Mat A)
42306a1af2fSStefano Zampini {
424362febeeSStefano Zampini   PetscFunctionBegin;
4255f80ce2aSJacob Faibussowitsch   CHKERRQ(MatReset_Nest(A));
4265f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree(A->data));
4275f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",NULL));
4285f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",NULL));
4295f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",NULL));
4305f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",NULL));
4315f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",NULL));
4325f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",NULL));
4335f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",NULL));
4345f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",NULL));
4355f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",NULL));
4365f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",NULL));
4375f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",NULL));
4385f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",NULL));
4395f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpidense_C",NULL));
4405f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqdense_C",NULL));
4415f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_seqdense_C",NULL));
4425f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_mpidense_C",NULL));
4435f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_dense_C",NULL));
444d8588912SDave May   PetscFunctionReturn(0);
445d8588912SDave May }
446d8588912SDave May 
447381b8e50SStefano Zampini static PetscErrorCode MatMissingDiagonal_Nest(Mat mat,PetscBool *missing,PetscInt *dd)
448381b8e50SStefano Zampini {
449381b8e50SStefano Zampini   Mat_Nest       *vs = (Mat_Nest*)mat->data;
450381b8e50SStefano Zampini   PetscInt       i;
451381b8e50SStefano Zampini 
452381b8e50SStefano Zampini   PetscFunctionBegin;
453381b8e50SStefano Zampini   if (dd) *dd = 0;
454381b8e50SStefano Zampini   if (!vs->nr) {
455381b8e50SStefano Zampini     *missing = PETSC_TRUE;
456381b8e50SStefano Zampini     PetscFunctionReturn(0);
457381b8e50SStefano Zampini   }
458381b8e50SStefano Zampini   *missing = PETSC_FALSE;
459381b8e50SStefano Zampini   for (i = 0; i < vs->nr && !(*missing); i++) {
460381b8e50SStefano Zampini     *missing = PETSC_TRUE;
461381b8e50SStefano Zampini     if (vs->m[i][i]) {
4625f80ce2aSJacob Faibussowitsch       CHKERRQ(MatMissingDiagonal(vs->m[i][i],missing,NULL));
4632c71b3e2SJacob Faibussowitsch       PetscCheckFalse(*missing && dd,PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"First missing entry not yet implemented");
464381b8e50SStefano Zampini     }
465381b8e50SStefano Zampini   }
466381b8e50SStefano Zampini   PetscFunctionReturn(0);
467381b8e50SStefano Zampini }
468381b8e50SStefano Zampini 
469207556f9SJed Brown static PetscErrorCode MatAssemblyBegin_Nest(Mat A,MatAssemblyType type)
470d8588912SDave May {
471d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
472d8588912SDave May   PetscInt       i,j;
47306a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
474d8588912SDave May 
475d8588912SDave May   PetscFunctionBegin;
476d8588912SDave May   for (i=0; i<vs->nr; i++) {
477d8588912SDave May     for (j=0; j<vs->nc; j++) {
47806a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
479e7c19651SJed Brown       if (vs->m[i][j]) {
4805f80ce2aSJacob Faibussowitsch         CHKERRQ(MatAssemblyBegin(vs->m[i][j],type));
481e7c19651SJed Brown         if (!vs->splitassembly) {
482e7c19651SJed Brown           /* Note: split assembly will fail if the same block appears more than once (even indirectly through a nested
483e7c19651SJed Brown            * sub-block). This could be fixed by adding a flag to Mat so that there was a way to check if a Mat was
484e7c19651SJed Brown            * already performing an assembly, but the result would by more complicated and appears to offer less
485e7c19651SJed Brown            * potential for diagnostics and correctness checking. Split assembly should be fixed once there is an
486e7c19651SJed Brown            * interface for libraries to make asynchronous progress in "user-defined non-blocking collectives".
487e7c19651SJed Brown            */
4885f80ce2aSJacob Faibussowitsch           CHKERRQ(MatAssemblyEnd(vs->m[i][j],type));
4895f80ce2aSJacob Faibussowitsch           CHKERRQ(MatGetNonzeroState(vs->m[i][j],&subnnzstate));
490e7c19651SJed Brown         }
491e7c19651SJed Brown       }
49206a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || vs->nnzstate[i*vs->nc+j] != subnnzstate);
49306a1af2fSStefano Zampini       vs->nnzstate[i*vs->nc+j] = subnnzstate;
494d8588912SDave May     }
495d8588912SDave May   }
49606a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
497d8588912SDave May   PetscFunctionReturn(0);
498d8588912SDave May }
499d8588912SDave May 
500207556f9SJed Brown static PetscErrorCode MatAssemblyEnd_Nest(Mat A, MatAssemblyType type)
501d8588912SDave May {
502d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
503d8588912SDave May   PetscInt       i,j;
504d8588912SDave May 
505d8588912SDave May   PetscFunctionBegin;
506d8588912SDave May   for (i=0; i<vs->nr; i++) {
507d8588912SDave May     for (j=0; j<vs->nc; j++) {
508e7c19651SJed Brown       if (vs->m[i][j]) {
509e7c19651SJed Brown         if (vs->splitassembly) {
5105f80ce2aSJacob Faibussowitsch           CHKERRQ(MatAssemblyEnd(vs->m[i][j],type));
511e7c19651SJed Brown         }
512e7c19651SJed Brown       }
513d8588912SDave May     }
514d8588912SDave May   }
515d8588912SDave May   PetscFunctionReturn(0);
516d8588912SDave May }
517d8588912SDave May 
518f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatRow(Mat A,PetscInt row,Mat *B)
519d8588912SDave May {
520f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
521f349c1fdSJed Brown   PetscInt       j;
522f349c1fdSJed Brown   Mat            sub;
523d8588912SDave May 
524d8588912SDave May   PetscFunctionBegin;
5250298fd71SBarry Smith   sub = (row < vs->nc) ? vs->m[row][row] : (Mat)NULL; /* Prefer to find on the diagonal */
526f349c1fdSJed Brown   for (j=0; !sub && j<vs->nc; j++) sub = vs->m[row][j];
5275f80ce2aSJacob Faibussowitsch   if (sub) CHKERRQ(MatSetUp(sub));       /* Ensure that the sizes are available */
528f349c1fdSJed Brown   *B = sub;
529f349c1fdSJed Brown   PetscFunctionReturn(0);
530d8588912SDave May }
531d8588912SDave May 
532f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatCol(Mat A,PetscInt col,Mat *B)
533f349c1fdSJed Brown {
534f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
535f349c1fdSJed Brown   PetscInt       i;
536f349c1fdSJed Brown   Mat            sub;
537f349c1fdSJed Brown 
538f349c1fdSJed Brown   PetscFunctionBegin;
5390298fd71SBarry Smith   sub = (col < vs->nr) ? vs->m[col][col] : (Mat)NULL; /* Prefer to find on the diagonal */
540f349c1fdSJed Brown   for (i=0; !sub && i<vs->nr; i++) sub = vs->m[i][col];
5415f80ce2aSJacob Faibussowitsch   if (sub) CHKERRQ(MatSetUp(sub));       /* Ensure that the sizes are available */
542f349c1fdSJed Brown   *B = sub;
543f349c1fdSJed Brown   PetscFunctionReturn(0);
544d8588912SDave May }
545d8588912SDave May 
54618d228c0SPierre Jolivet static PetscErrorCode MatNestFindISRange(Mat A,PetscInt n,const IS list[],IS is,PetscInt *begin,PetscInt *end)
547f349c1fdSJed Brown {
54818d228c0SPierre Jolivet   PetscInt       i,j,size,m;
549f349c1fdSJed Brown   PetscBool      flg;
55018d228c0SPierre Jolivet   IS             out,concatenate[2];
551f349c1fdSJed Brown 
552f349c1fdSJed Brown   PetscFunctionBegin;
553f349c1fdSJed Brown   PetscValidPointer(list,3);
554f349c1fdSJed Brown   PetscValidHeaderSpecific(is,IS_CLASSID,4);
55518d228c0SPierre Jolivet   if (begin) {
55618d228c0SPierre Jolivet     PetscValidIntPointer(begin,5);
55718d228c0SPierre Jolivet     *begin = -1;
55818d228c0SPierre Jolivet   }
55918d228c0SPierre Jolivet   if (end) {
56018d228c0SPierre Jolivet     PetscValidIntPointer(end,6);
56118d228c0SPierre Jolivet     *end = -1;
56218d228c0SPierre Jolivet   }
563f349c1fdSJed Brown   for (i=0; i<n; i++) {
564207556f9SJed Brown     if (!list[i]) continue;
5655f80ce2aSJacob Faibussowitsch     CHKERRQ(ISEqualUnsorted(list[i],is,&flg));
566f349c1fdSJed Brown     if (flg) {
56718d228c0SPierre Jolivet       if (begin) *begin = i;
56818d228c0SPierre Jolivet       if (end) *end = i+1;
569f349c1fdSJed Brown       PetscFunctionReturn(0);
570f349c1fdSJed Brown     }
571f349c1fdSJed Brown   }
5725f80ce2aSJacob Faibussowitsch   CHKERRQ(ISGetSize(is,&size));
57318d228c0SPierre Jolivet   for (i=0; i<n-1; i++) {
57418d228c0SPierre Jolivet     if (!list[i]) continue;
57518d228c0SPierre Jolivet     m = 0;
5765f80ce2aSJacob Faibussowitsch     CHKERRQ(ISConcatenate(PetscObjectComm((PetscObject)A),2,list+i,&out));
5775f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetSize(out,&m));
57818d228c0SPierre Jolivet     for (j=i+2; j<n && m<size; j++) {
57918d228c0SPierre Jolivet       if (list[j]) {
58018d228c0SPierre Jolivet         concatenate[0] = out;
58118d228c0SPierre Jolivet         concatenate[1] = list[j];
5825f80ce2aSJacob Faibussowitsch         CHKERRQ(ISConcatenate(PetscObjectComm((PetscObject)A),2,concatenate,&out));
5835f80ce2aSJacob Faibussowitsch         CHKERRQ(ISDestroy(concatenate));
5845f80ce2aSJacob Faibussowitsch         CHKERRQ(ISGetSize(out,&m));
58518d228c0SPierre Jolivet       }
58618d228c0SPierre Jolivet     }
58718d228c0SPierre Jolivet     if (m == size) {
5885f80ce2aSJacob Faibussowitsch       CHKERRQ(ISEqualUnsorted(out,is,&flg));
58918d228c0SPierre Jolivet       if (flg) {
59018d228c0SPierre Jolivet         if (begin) *begin = i;
59118d228c0SPierre Jolivet         if (end) *end = j;
5925f80ce2aSJacob Faibussowitsch         CHKERRQ(ISDestroy(&out));
59318d228c0SPierre Jolivet         PetscFunctionReturn(0);
59418d228c0SPierre Jolivet       }
59518d228c0SPierre Jolivet     }
5965f80ce2aSJacob Faibussowitsch     CHKERRQ(ISDestroy(&out));
59718d228c0SPierre Jolivet   }
59818d228c0SPierre Jolivet   PetscFunctionReturn(0);
599f349c1fdSJed Brown }
600f349c1fdSJed Brown 
60118d228c0SPierre Jolivet static PetscErrorCode MatNestFillEmptyMat_Private(Mat A,PetscInt i,PetscInt j,Mat *B)
6028188e55aSJed Brown {
6038188e55aSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
60418d228c0SPierre Jolivet   PetscInt       lr,lc;
60518d228c0SPierre Jolivet 
60618d228c0SPierre Jolivet   PetscFunctionBegin;
6075f80ce2aSJacob Faibussowitsch   CHKERRQ(MatCreate(PetscObjectComm((PetscObject)A),B));
6085f80ce2aSJacob Faibussowitsch   CHKERRQ(ISGetLocalSize(vs->isglobal.row[i],&lr));
6095f80ce2aSJacob Faibussowitsch   CHKERRQ(ISGetLocalSize(vs->isglobal.col[j],&lc));
6105f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSetSizes(*B,lr,lc,PETSC_DECIDE,PETSC_DECIDE));
6115f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSetType(*B,MATAIJ));
6125f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSeqAIJSetPreallocation(*B,0,NULL));
6135f80ce2aSJacob Faibussowitsch   CHKERRQ(MatMPIAIJSetPreallocation(*B,0,NULL,0,NULL));
6145f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSetUp(*B));
6155f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSetOption(*B,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE));
6165f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY));
6175f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY));
61818d228c0SPierre Jolivet   PetscFunctionReturn(0);
61918d228c0SPierre Jolivet }
62018d228c0SPierre Jolivet 
62118d228c0SPierre Jolivet static PetscErrorCode MatNestGetBlock_Private(Mat A,PetscInt rbegin,PetscInt rend,PetscInt cbegin,PetscInt cend,Mat *B)
62218d228c0SPierre Jolivet {
62318d228c0SPierre Jolivet   Mat_Nest       *vs = (Mat_Nest*)A->data;
62418d228c0SPierre Jolivet   Mat            *a;
62518d228c0SPierre Jolivet   PetscInt       i,j,k,l,nr=rend-rbegin,nc=cend-cbegin;
6268188e55aSJed Brown   char           keyname[256];
62718d228c0SPierre Jolivet   PetscBool      *b;
62818d228c0SPierre Jolivet   PetscBool      flg;
6298188e55aSJed Brown 
6308188e55aSJed Brown   PetscFunctionBegin;
6310298fd71SBarry Smith   *B   = NULL;
6325f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscSNPrintf(keyname,sizeof(keyname),"NestBlock_%" PetscInt_FMT "-%" PetscInt_FMT "x%" PetscInt_FMT "-%" PetscInt_FMT,rbegin,rend,cbegin,cend));
6335f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectQuery((PetscObject)A,keyname,(PetscObject*)B));
6348188e55aSJed Brown   if (*B) PetscFunctionReturn(0);
6358188e55aSJed Brown 
6365f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMalloc2(nr*nc,&a,nr*nc,&b));
63718d228c0SPierre Jolivet   for (i=0; i<nr; i++) {
63818d228c0SPierre Jolivet     for (j=0; j<nc; j++) {
63918d228c0SPierre Jolivet       a[i*nc + j] = vs->m[rbegin+i][cbegin+j];
64018d228c0SPierre Jolivet       b[i*nc + j] = PETSC_FALSE;
64118d228c0SPierre Jolivet     }
64218d228c0SPierre Jolivet   }
64318d228c0SPierre Jolivet   if (nc!=vs->nc&&nr!=vs->nr) {
64418d228c0SPierre Jolivet     for (i=0; i<nr; i++) {
64518d228c0SPierre Jolivet       for (j=0; j<nc; j++) {
64618d228c0SPierre Jolivet         flg = PETSC_FALSE;
64718d228c0SPierre Jolivet         for (k=0; (k<nr&&!flg); k++) {
64818d228c0SPierre Jolivet           if (a[j + k*nc]) flg = PETSC_TRUE;
64918d228c0SPierre Jolivet         }
65018d228c0SPierre Jolivet         if (flg) {
65118d228c0SPierre Jolivet           flg = PETSC_FALSE;
65218d228c0SPierre Jolivet           for (l=0; (l<nc&&!flg); l++) {
65318d228c0SPierre Jolivet             if (a[i*nc + l]) flg = PETSC_TRUE;
65418d228c0SPierre Jolivet           }
65518d228c0SPierre Jolivet         }
65618d228c0SPierre Jolivet         if (!flg) {
65718d228c0SPierre Jolivet           b[i*nc + j] = PETSC_TRUE;
6585f80ce2aSJacob Faibussowitsch           CHKERRQ(MatNestFillEmptyMat_Private(A,rbegin+i,cbegin+j,a + i*nc + j));
65918d228c0SPierre Jolivet         }
66018d228c0SPierre Jolivet       }
66118d228c0SPierre Jolivet     }
66218d228c0SPierre Jolivet   }
6635f80ce2aSJacob Faibussowitsch   CHKERRQ(MatCreateNest(PetscObjectComm((PetscObject)A),nr,nr!=vs->nr?NULL:vs->isglobal.row,nc,nc!=vs->nc?NULL:vs->isglobal.col,a,B));
66418d228c0SPierre Jolivet   for (i=0; i<nr; i++) {
66518d228c0SPierre Jolivet     for (j=0; j<nc; j++) {
66618d228c0SPierre Jolivet       if (b[i*nc + j]) {
6675f80ce2aSJacob Faibussowitsch         CHKERRQ(MatDestroy(a + i*nc + j));
66818d228c0SPierre Jolivet       }
66918d228c0SPierre Jolivet     }
67018d228c0SPierre Jolivet   }
6715f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree2(a,b));
6728188e55aSJed Brown   (*B)->assembled = A->assembled;
6735f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectCompose((PetscObject)A,keyname,(PetscObject)*B));
6745f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectDereference((PetscObject)*B)); /* Leave the only remaining reference in the composition */
6758188e55aSJed Brown   PetscFunctionReturn(0);
6768188e55aSJed Brown }
6778188e55aSJed Brown 
678f349c1fdSJed Brown static PetscErrorCode MatNestFindSubMat(Mat A,struct MatNestISPair *is,IS isrow,IS iscol,Mat *B)
679f349c1fdSJed Brown {
680f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
68118d228c0SPierre Jolivet   PetscInt       rbegin,rend,cbegin,cend;
682f349c1fdSJed Brown 
683f349c1fdSJed Brown   PetscFunctionBegin;
6845f80ce2aSJacob Faibussowitsch   CHKERRQ(MatNestFindISRange(A,vs->nr,is->row,isrow,&rbegin,&rend));
6855f80ce2aSJacob Faibussowitsch   CHKERRQ(MatNestFindISRange(A,vs->nc,is->col,iscol,&cbegin,&cend));
68618d228c0SPierre Jolivet   if (rend == rbegin + 1 && cend == cbegin + 1) {
68718d228c0SPierre Jolivet     if (!vs->m[rbegin][cbegin]) {
6885f80ce2aSJacob Faibussowitsch       CHKERRQ(MatNestFillEmptyMat_Private(A,rbegin,cbegin,vs->m[rbegin] + cbegin));
68977019fcaSJed Brown     }
69018d228c0SPierre Jolivet     *B = vs->m[rbegin][cbegin];
69118d228c0SPierre Jolivet   } else if (rbegin != -1 && cbegin != -1) {
6925f80ce2aSJacob Faibussowitsch     CHKERRQ(MatNestGetBlock_Private(A,rbegin,rend,cbegin,cend,B));
69318d228c0SPierre Jolivet   } else SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Could not find index set");
694f349c1fdSJed Brown   PetscFunctionReturn(0);
695f349c1fdSJed Brown }
696f349c1fdSJed Brown 
69706a1af2fSStefano Zampini /*
69806a1af2fSStefano Zampini    TODO: This does not actually returns a submatrix we can modify
69906a1af2fSStefano Zampini */
7007dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrix_Nest(Mat A,IS isrow,IS iscol,MatReuse reuse,Mat *B)
701f349c1fdSJed Brown {
702f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
703f349c1fdSJed Brown   Mat            sub;
704f349c1fdSJed Brown 
705f349c1fdSJed Brown   PetscFunctionBegin;
7065f80ce2aSJacob Faibussowitsch   CHKERRQ(MatNestFindSubMat(A,&vs->isglobal,isrow,iscol,&sub));
707f349c1fdSJed Brown   switch (reuse) {
708f349c1fdSJed Brown   case MAT_INITIAL_MATRIX:
7095f80ce2aSJacob Faibussowitsch     if (sub) CHKERRQ(PetscObjectReference((PetscObject)sub));
710f349c1fdSJed Brown     *B = sub;
711f349c1fdSJed Brown     break;
712f349c1fdSJed Brown   case MAT_REUSE_MATRIX:
7132c71b3e2SJacob Faibussowitsch     PetscCheckFalse(sub != *B,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Submatrix was not used before in this call");
714f349c1fdSJed Brown     break;
715f349c1fdSJed Brown   case MAT_IGNORE_MATRIX:       /* Nothing to do */
716f349c1fdSJed Brown     break;
717511c6705SHong Zhang   case MAT_INPLACE_MATRIX:       /* Nothing to do */
718511c6705SHong Zhang     SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MAT_INPLACE_MATRIX is not supported yet");
719f349c1fdSJed Brown   }
720f349c1fdSJed Brown   PetscFunctionReturn(0);
721f349c1fdSJed Brown }
722f349c1fdSJed Brown 
723f349c1fdSJed Brown PetscErrorCode MatGetLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B)
724f349c1fdSJed Brown {
725f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
726f349c1fdSJed Brown   Mat            sub;
727f349c1fdSJed Brown 
728f349c1fdSJed Brown   PetscFunctionBegin;
7295f80ce2aSJacob Faibussowitsch   CHKERRQ(MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub));
730f349c1fdSJed Brown   /* We allow the submatrix to be NULL, perhaps it would be better for the user to return an empty matrix instead */
7315f80ce2aSJacob Faibussowitsch   if (sub) CHKERRQ(PetscObjectReference((PetscObject)sub));
732f349c1fdSJed Brown   *B = sub;
733d8588912SDave May   PetscFunctionReturn(0);
734d8588912SDave May }
735d8588912SDave May 
736207556f9SJed Brown static PetscErrorCode MatRestoreLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B)
737d8588912SDave May {
738f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
739f349c1fdSJed Brown   Mat            sub;
740d8588912SDave May 
741d8588912SDave May   PetscFunctionBegin;
7425f80ce2aSJacob Faibussowitsch   CHKERRQ(MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub));
7432c71b3e2SJacob Faibussowitsch   PetscCheckFalse(*B != sub,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has not been gotten");
744f349c1fdSJed Brown   if (sub) {
7452c71b3e2SJacob Faibussowitsch     PetscCheckFalse(((PetscObject)sub)->refct <= 1,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has had reference count decremented too many times");
7465f80ce2aSJacob Faibussowitsch     CHKERRQ(MatDestroy(B));
747d8588912SDave May   }
748d8588912SDave May   PetscFunctionReturn(0);
749d8588912SDave May }
750d8588912SDave May 
7517874fa86SDave May static PetscErrorCode MatGetDiagonal_Nest(Mat A,Vec v)
7527874fa86SDave May {
7537874fa86SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
7547874fa86SDave May   PetscInt       i;
7557874fa86SDave May 
7567874fa86SDave May   PetscFunctionBegin;
7577874fa86SDave May   for (i=0; i<bA->nr; i++) {
758429bac76SJed Brown     Vec bv;
7595f80ce2aSJacob Faibussowitsch     CHKERRQ(VecGetSubVector(v,bA->isglobal.row[i],&bv));
7607874fa86SDave May     if (bA->m[i][i]) {
7615f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetDiagonal(bA->m[i][i],bv));
7627874fa86SDave May     } else {
7635f80ce2aSJacob Faibussowitsch       CHKERRQ(VecSet(bv,0.0));
7647874fa86SDave May     }
7655f80ce2aSJacob Faibussowitsch     CHKERRQ(VecRestoreSubVector(v,bA->isglobal.row[i],&bv));
7667874fa86SDave May   }
7677874fa86SDave May   PetscFunctionReturn(0);
7687874fa86SDave May }
7697874fa86SDave May 
7707874fa86SDave May static PetscErrorCode MatDiagonalScale_Nest(Mat A,Vec l,Vec r)
7717874fa86SDave May {
7727874fa86SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
773429bac76SJed Brown   Vec            bl,*br;
7747874fa86SDave May   PetscInt       i,j;
7757874fa86SDave May 
7767874fa86SDave May   PetscFunctionBegin;
7775f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscCalloc1(bA->nc,&br));
7782e6472ebSElliott Sales de Andrade   if (r) {
7795f80ce2aSJacob Faibussowitsch     for (j=0; j<bA->nc; j++) CHKERRQ(VecGetSubVector(r,bA->isglobal.col[j],&br[j]));
7802e6472ebSElliott Sales de Andrade   }
7812e6472ebSElliott Sales de Andrade   bl = NULL;
7827874fa86SDave May   for (i=0; i<bA->nr; i++) {
7832e6472ebSElliott Sales de Andrade     if (l) {
7845f80ce2aSJacob Faibussowitsch       CHKERRQ(VecGetSubVector(l,bA->isglobal.row[i],&bl));
7852e6472ebSElliott Sales de Andrade     }
7867874fa86SDave May     for (j=0; j<bA->nc; j++) {
7877874fa86SDave May       if (bA->m[i][j]) {
7885f80ce2aSJacob Faibussowitsch         CHKERRQ(MatDiagonalScale(bA->m[i][j],bl,br[j]));
7897874fa86SDave May       }
7907874fa86SDave May     }
7912e6472ebSElliott Sales de Andrade     if (l) {
7925f80ce2aSJacob Faibussowitsch       CHKERRQ(VecRestoreSubVector(l,bA->isglobal.row[i],&bl));
7937874fa86SDave May     }
7942e6472ebSElliott Sales de Andrade   }
7952e6472ebSElliott Sales de Andrade   if (r) {
7965f80ce2aSJacob Faibussowitsch     for (j=0; j<bA->nc; j++) CHKERRQ(VecRestoreSubVector(r,bA->isglobal.col[j],&br[j]));
7972e6472ebSElliott Sales de Andrade   }
7985f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree(br));
7997874fa86SDave May   PetscFunctionReturn(0);
8007874fa86SDave May }
8017874fa86SDave May 
802a061e289SJed Brown static PetscErrorCode MatScale_Nest(Mat A,PetscScalar a)
803a061e289SJed Brown {
804a061e289SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
805a061e289SJed Brown   PetscInt       i,j;
806a061e289SJed Brown 
807a061e289SJed Brown   PetscFunctionBegin;
808a061e289SJed Brown   for (i=0; i<bA->nr; i++) {
809a061e289SJed Brown     for (j=0; j<bA->nc; j++) {
810a061e289SJed Brown       if (bA->m[i][j]) {
8115f80ce2aSJacob Faibussowitsch         CHKERRQ(MatScale(bA->m[i][j],a));
812a061e289SJed Brown       }
813a061e289SJed Brown     }
814a061e289SJed Brown   }
815a061e289SJed Brown   PetscFunctionReturn(0);
816a061e289SJed Brown }
817a061e289SJed Brown 
818a061e289SJed Brown static PetscErrorCode MatShift_Nest(Mat A,PetscScalar a)
819a061e289SJed Brown {
820a061e289SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
821a061e289SJed Brown   PetscInt       i;
82206a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
823a061e289SJed Brown 
824a061e289SJed Brown   PetscFunctionBegin;
825a061e289SJed Brown   for (i=0; i<bA->nr; i++) {
82606a1af2fSStefano Zampini     PetscObjectState subnnzstate = 0;
8272c71b3e2SJacob Faibussowitsch     PetscCheckFalse(!bA->m[i][i],PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"No support for shifting an empty diagonal block, insert a matrix in block (%" PetscInt_FMT ",%" PetscInt_FMT ")",i,i);
8285f80ce2aSJacob Faibussowitsch     CHKERRQ(MatShift(bA->m[i][i],a));
8295f80ce2aSJacob Faibussowitsch     CHKERRQ(MatGetNonzeroState(bA->m[i][i],&subnnzstate));
83006a1af2fSStefano Zampini     nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i*bA->nc+i] != subnnzstate);
83106a1af2fSStefano Zampini     bA->nnzstate[i*bA->nc+i] = subnnzstate;
832a061e289SJed Brown   }
83306a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
834a061e289SJed Brown   PetscFunctionReturn(0);
835a061e289SJed Brown }
836a061e289SJed Brown 
83713135bc6SAlex Fikl static PetscErrorCode MatDiagonalSet_Nest(Mat A,Vec D,InsertMode is)
83813135bc6SAlex Fikl {
83913135bc6SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data;
84013135bc6SAlex Fikl   PetscInt       i;
84106a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
84213135bc6SAlex Fikl 
84313135bc6SAlex Fikl   PetscFunctionBegin;
84413135bc6SAlex Fikl   for (i=0; i<bA->nr; i++) {
84506a1af2fSStefano Zampini     PetscObjectState subnnzstate = 0;
84613135bc6SAlex Fikl     Vec              bv;
8475f80ce2aSJacob Faibussowitsch     CHKERRQ(VecGetSubVector(D,bA->isglobal.row[i],&bv));
84813135bc6SAlex Fikl     if (bA->m[i][i]) {
8495f80ce2aSJacob Faibussowitsch       CHKERRQ(MatDiagonalSet(bA->m[i][i],bv,is));
8505f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetNonzeroState(bA->m[i][i],&subnnzstate));
85113135bc6SAlex Fikl     }
8525f80ce2aSJacob Faibussowitsch     CHKERRQ(VecRestoreSubVector(D,bA->isglobal.row[i],&bv));
85306a1af2fSStefano Zampini     nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i*bA->nc+i] != subnnzstate);
85406a1af2fSStefano Zampini     bA->nnzstate[i*bA->nc+i] = subnnzstate;
85513135bc6SAlex Fikl   }
85606a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
85713135bc6SAlex Fikl   PetscFunctionReturn(0);
85813135bc6SAlex Fikl }
85913135bc6SAlex Fikl 
860f8170845SAlex Fikl static PetscErrorCode MatSetRandom_Nest(Mat A,PetscRandom rctx)
861f8170845SAlex Fikl {
862f8170845SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data;
863f8170845SAlex Fikl   PetscInt       i,j;
864f8170845SAlex Fikl 
865f8170845SAlex Fikl   PetscFunctionBegin;
866f8170845SAlex Fikl   for (i=0; i<bA->nr; i++) {
867f8170845SAlex Fikl     for (j=0; j<bA->nc; j++) {
868f8170845SAlex Fikl       if (bA->m[i][j]) {
8695f80ce2aSJacob Faibussowitsch         CHKERRQ(MatSetRandom(bA->m[i][j],rctx));
870f8170845SAlex Fikl       }
871f8170845SAlex Fikl     }
872f8170845SAlex Fikl   }
873f8170845SAlex Fikl   PetscFunctionReturn(0);
874f8170845SAlex Fikl }
875f8170845SAlex Fikl 
8762a7a6963SBarry Smith static PetscErrorCode MatCreateVecs_Nest(Mat A,Vec *right,Vec *left)
877d8588912SDave May {
878d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
879d8588912SDave May   Vec            *L,*R;
880d8588912SDave May   MPI_Comm       comm;
881d8588912SDave May   PetscInt       i,j;
882d8588912SDave May 
883d8588912SDave May   PetscFunctionBegin;
8845f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectGetComm((PetscObject)A,&comm));
885d8588912SDave May   if (right) {
886d8588912SDave May     /* allocate R */
8875f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscMalloc1(bA->nc, &R));
888d8588912SDave May     /* Create the right vectors */
889d8588912SDave May     for (j=0; j<bA->nc; j++) {
890d8588912SDave May       for (i=0; i<bA->nr; i++) {
891d8588912SDave May         if (bA->m[i][j]) {
8925f80ce2aSJacob Faibussowitsch           CHKERRQ(MatCreateVecs(bA->m[i][j],&R[j],NULL));
893d8588912SDave May           break;
894d8588912SDave May         }
895d8588912SDave May       }
8962c71b3e2SJacob Faibussowitsch       PetscCheckFalse(i==bA->nr,PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null column.");
897d8588912SDave May     }
8985f80ce2aSJacob Faibussowitsch     CHKERRQ(VecCreateNest(comm,bA->nc,bA->isglobal.col,R,right));
899d8588912SDave May     /* hand back control to the nest vector */
900d8588912SDave May     for (j=0; j<bA->nc; j++) {
9015f80ce2aSJacob Faibussowitsch       CHKERRQ(VecDestroy(&R[j]));
902d8588912SDave May     }
9035f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscFree(R));
904d8588912SDave May   }
905d8588912SDave May 
906d8588912SDave May   if (left) {
907d8588912SDave May     /* allocate L */
9085f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscMalloc1(bA->nr, &L));
909d8588912SDave May     /* Create the left vectors */
910d8588912SDave May     for (i=0; i<bA->nr; i++) {
911d8588912SDave May       for (j=0; j<bA->nc; j++) {
912d8588912SDave May         if (bA->m[i][j]) {
9135f80ce2aSJacob Faibussowitsch           CHKERRQ(MatCreateVecs(bA->m[i][j],NULL,&L[i]));
914d8588912SDave May           break;
915d8588912SDave May         }
916d8588912SDave May       }
9172c71b3e2SJacob Faibussowitsch       PetscCheckFalse(j==bA->nc,PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null row.");
918d8588912SDave May     }
919d8588912SDave May 
9205f80ce2aSJacob Faibussowitsch     CHKERRQ(VecCreateNest(comm,bA->nr,bA->isglobal.row,L,left));
921d8588912SDave May     for (i=0; i<bA->nr; i++) {
9225f80ce2aSJacob Faibussowitsch       CHKERRQ(VecDestroy(&L[i]));
923d8588912SDave May     }
924d8588912SDave May 
9255f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscFree(L));
926d8588912SDave May   }
927d8588912SDave May   PetscFunctionReturn(0);
928d8588912SDave May }
929d8588912SDave May 
930207556f9SJed Brown static PetscErrorCode MatView_Nest(Mat A,PetscViewer viewer)
931d8588912SDave May {
932d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
93329e60adbSStefano Zampini   PetscBool      isascii,viewSub = PETSC_FALSE;
934d8588912SDave May   PetscInt       i,j;
935d8588912SDave May 
936d8588912SDave May   PetscFunctionBegin;
9375f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii));
938d8588912SDave May   if (isascii) {
939d8588912SDave May 
9405f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscOptionsGetBool(((PetscObject)A)->options,((PetscObject)A)->prefix,"-mat_view_nest_sub",&viewSub,NULL));
9415f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscViewerASCIIPrintf(viewer,"Matrix object: \n"));
9425f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscViewerASCIIPushTab(viewer));
9435f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscViewerASCIIPrintf(viewer, "type=nest, rows=%" PetscInt_FMT ", cols=%" PetscInt_FMT " \n",bA->nr,bA->nc));
944d8588912SDave May 
9455f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscViewerASCIIPrintf(viewer,"MatNest structure: \n"));
946d8588912SDave May     for (i=0; i<bA->nr; i++) {
947d8588912SDave May       for (j=0; j<bA->nc; j++) {
94819fd82e9SBarry Smith         MatType   type;
949270f95d7SJed Brown         char      name[256] = "",prefix[256] = "";
950d8588912SDave May         PetscInt  NR,NC;
951d8588912SDave May         PetscBool isNest = PETSC_FALSE;
952d8588912SDave May 
953d8588912SDave May         if (!bA->m[i][j]) {
9545f80ce2aSJacob Faibussowitsch           CHKERRQ(PetscViewerASCIIPrintf(viewer, "(%" PetscInt_FMT ",%" PetscInt_FMT ") : NULL \n",i,j));
955d8588912SDave May           continue;
956d8588912SDave May         }
9575f80ce2aSJacob Faibussowitsch         CHKERRQ(MatGetSize(bA->m[i][j],&NR,&NC));
9585f80ce2aSJacob Faibussowitsch         CHKERRQ(MatGetType(bA->m[i][j], &type));
9595f80ce2aSJacob Faibussowitsch         if (((PetscObject)bA->m[i][j])->name) CHKERRQ(PetscSNPrintf(name,sizeof(name),"name=\"%s\", ",((PetscObject)bA->m[i][j])->name));
9605f80ce2aSJacob Faibussowitsch         if (((PetscObject)bA->m[i][j])->prefix) CHKERRQ(PetscSNPrintf(prefix,sizeof(prefix),"prefix=\"%s\", ",((PetscObject)bA->m[i][j])->prefix));
9615f80ce2aSJacob Faibussowitsch         CHKERRQ(PetscObjectTypeCompare((PetscObject)bA->m[i][j],MATNEST,&isNest));
962d8588912SDave May 
9635f80ce2aSJacob Faibussowitsch         CHKERRQ(PetscViewerASCIIPrintf(viewer,"(%" PetscInt_FMT ",%" PetscInt_FMT ") : %s%stype=%s, rows=%" PetscInt_FMT ", cols=%" PetscInt_FMT " \n",i,j,name,prefix,type,NR,NC));
964d8588912SDave May 
96529e60adbSStefano Zampini         if (isNest || viewSub) {
9665f80ce2aSJacob Faibussowitsch           CHKERRQ(PetscViewerASCIIPushTab(viewer));  /* push1 */
9675f80ce2aSJacob Faibussowitsch           CHKERRQ(MatView(bA->m[i][j],viewer));
9685f80ce2aSJacob Faibussowitsch           CHKERRQ(PetscViewerASCIIPopTab(viewer));    /* pop1 */
969d8588912SDave May         }
970d8588912SDave May       }
971d8588912SDave May     }
9725f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscViewerASCIIPopTab(viewer));    /* pop0 */
973d8588912SDave May   }
974d8588912SDave May   PetscFunctionReturn(0);
975d8588912SDave May }
976d8588912SDave May 
977207556f9SJed Brown static PetscErrorCode MatZeroEntries_Nest(Mat A)
978d8588912SDave May {
979d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
980d8588912SDave May   PetscInt       i,j;
981d8588912SDave May 
982d8588912SDave May   PetscFunctionBegin;
983d8588912SDave May   for (i=0; i<bA->nr; i++) {
984d8588912SDave May     for (j=0; j<bA->nc; j++) {
985d8588912SDave May       if (!bA->m[i][j]) continue;
9865f80ce2aSJacob Faibussowitsch       CHKERRQ(MatZeroEntries(bA->m[i][j]));
987d8588912SDave May     }
988d8588912SDave May   }
989d8588912SDave May   PetscFunctionReturn(0);
990d8588912SDave May }
991d8588912SDave May 
992c222c20dSDavid Ham static PetscErrorCode MatCopy_Nest(Mat A,Mat B,MatStructure str)
993c222c20dSDavid Ham {
994c222c20dSDavid Ham   Mat_Nest       *bA = (Mat_Nest*)A->data,*bB = (Mat_Nest*)B->data;
995c222c20dSDavid Ham   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
99606a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
997c222c20dSDavid Ham 
998c222c20dSDavid Ham   PetscFunctionBegin;
9992c71b3e2SJacob Faibussowitsch   PetscCheckFalse(nr != bB->nr || nc != bB->nc,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Cannot copy a Mat_Nest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ") to a Mat_Nest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ")",bB->nr,bB->nc,nr,nc);
1000c222c20dSDavid Ham   for (i=0; i<nr; i++) {
1001c222c20dSDavid Ham     for (j=0; j<nc; j++) {
100206a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
100346a2b97cSJed Brown       if (bA->m[i][j] && bB->m[i][j]) {
10045f80ce2aSJacob Faibussowitsch         CHKERRQ(MatCopy(bA->m[i][j],bB->m[i][j],str));
10052c71b3e2SJacob Faibussowitsch       } else PetscCheckFalse(bA->m[i][j] || bB->m[i][j],PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %" PetscInt_FMT ",%" PetscInt_FMT,i,j);
10065f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetNonzeroState(bB->m[i][j],&subnnzstate));
100706a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || bB->nnzstate[i*nc+j] != subnnzstate);
100806a1af2fSStefano Zampini       bB->nnzstate[i*nc+j] = subnnzstate;
1009c222c20dSDavid Ham     }
1010c222c20dSDavid Ham   }
101106a1af2fSStefano Zampini   if (nnzstate) B->nonzerostate++;
1012c222c20dSDavid Ham   PetscFunctionReturn(0);
1013c222c20dSDavid Ham }
1014c222c20dSDavid Ham 
10156e76ffeaSPierre Jolivet static PetscErrorCode MatAXPY_Nest(Mat Y,PetscScalar a,Mat X,MatStructure str)
10166e76ffeaSPierre Jolivet {
10176e76ffeaSPierre Jolivet   Mat_Nest       *bY = (Mat_Nest*)Y->data,*bX = (Mat_Nest*)X->data;
10186e76ffeaSPierre Jolivet   PetscInt       i,j,nr = bY->nr,nc = bY->nc;
101906a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
10206e76ffeaSPierre Jolivet 
10216e76ffeaSPierre Jolivet   PetscFunctionBegin;
10222c71b3e2SJacob Faibussowitsch   PetscCheckFalse(nr != bX->nr || nc != bX->nc,PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Cannot AXPY a MatNest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ") with a MatNest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ")",bX->nr,bX->nc,nr,nc);
10236e76ffeaSPierre Jolivet   for (i=0; i<nr; i++) {
10246e76ffeaSPierre Jolivet     for (j=0; j<nc; j++) {
102506a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
10266e76ffeaSPierre Jolivet       if (bY->m[i][j] && bX->m[i][j]) {
10275f80ce2aSJacob Faibussowitsch         CHKERRQ(MatAXPY(bY->m[i][j],a,bX->m[i][j],str));
1028c066aebcSStefano Zampini       } else if (bX->m[i][j]) {
1029c066aebcSStefano Zampini         Mat M;
1030c066aebcSStefano Zampini 
10312c71b3e2SJacob Faibussowitsch         PetscCheckFalse(str != DIFFERENT_NONZERO_PATTERN,PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %" PetscInt_FMT ",%" PetscInt_FMT ". Use DIFFERENT_NONZERO_PATTERN",i,j);
10325f80ce2aSJacob Faibussowitsch         CHKERRQ(MatDuplicate(bX->m[i][j],MAT_COPY_VALUES,&M));
10335f80ce2aSJacob Faibussowitsch         CHKERRQ(MatNestSetSubMat(Y,i,j,M));
10345f80ce2aSJacob Faibussowitsch         CHKERRQ(MatDestroy(&M));
1035c066aebcSStefano Zampini       }
10365f80ce2aSJacob Faibussowitsch       if (bY->m[i][j]) CHKERRQ(MatGetNonzeroState(bY->m[i][j],&subnnzstate));
103706a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || bY->nnzstate[i*nc+j] != subnnzstate);
103806a1af2fSStefano Zampini       bY->nnzstate[i*nc+j] = subnnzstate;
10396e76ffeaSPierre Jolivet     }
10406e76ffeaSPierre Jolivet   }
104106a1af2fSStefano Zampini   if (nnzstate) Y->nonzerostate++;
10426e76ffeaSPierre Jolivet   PetscFunctionReturn(0);
10436e76ffeaSPierre Jolivet }
10446e76ffeaSPierre Jolivet 
1045207556f9SJed Brown static PetscErrorCode MatDuplicate_Nest(Mat A,MatDuplicateOption op,Mat *B)
1046d8588912SDave May {
1047d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
1048841e96a3SJed Brown   Mat            *b;
1049841e96a3SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
1050d8588912SDave May 
1051d8588912SDave May   PetscFunctionBegin;
10525f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMalloc1(nr*nc,&b));
1053841e96a3SJed Brown   for (i=0; i<nr; i++) {
1054841e96a3SJed Brown     for (j=0; j<nc; j++) {
1055841e96a3SJed Brown       if (bA->m[i][j]) {
10565f80ce2aSJacob Faibussowitsch         CHKERRQ(MatDuplicate(bA->m[i][j],op,&b[i*nc+j]));
1057841e96a3SJed Brown       } else {
10580298fd71SBarry Smith         b[i*nc+j] = NULL;
1059d8588912SDave May       }
1060d8588912SDave May     }
1061d8588912SDave May   }
10625f80ce2aSJacob Faibussowitsch   CHKERRQ(MatCreateNest(PetscObjectComm((PetscObject)A),nr,bA->isglobal.row,nc,bA->isglobal.col,b,B));
1063841e96a3SJed Brown   /* Give the new MatNest exclusive ownership */
1064841e96a3SJed Brown   for (i=0; i<nr*nc; i++) {
10655f80ce2aSJacob Faibussowitsch     CHKERRQ(MatDestroy(&b[i]));
1066d8588912SDave May   }
10675f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree(b));
1068d8588912SDave May 
10695f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY));
10705f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY));
1071d8588912SDave May   PetscFunctionReturn(0);
1072d8588912SDave May }
1073d8588912SDave May 
1074d8588912SDave May /* nest api */
1075d8588912SDave May PetscErrorCode MatNestGetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat *mat)
1076d8588912SDave May {
1077d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
10785fd66863SKarl Rupp 
1079d8588912SDave May   PetscFunctionBegin;
10802c71b3e2SJacob Faibussowitsch   PetscCheckFalse(idxm >= bA->nr,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT,idxm,bA->nr-1);
10812c71b3e2SJacob Faibussowitsch   PetscCheckFalse(jdxm >= bA->nc,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %" PetscInt_FMT " max %" PetscInt_FMT,jdxm,bA->nc-1);
1082d8588912SDave May   *mat = bA->m[idxm][jdxm];
1083d8588912SDave May   PetscFunctionReturn(0);
1084d8588912SDave May }
1085d8588912SDave May 
10869ba0d327SJed Brown /*@
1087d8588912SDave May  MatNestGetSubMat - Returns a single, sub-matrix from a nest matrix.
1088d8588912SDave May 
1089d8588912SDave May  Not collective
1090d8588912SDave May 
1091d8588912SDave May  Input Parameters:
1092629881c0SJed Brown +   A  - nest matrix
1093d8588912SDave May .   idxm - index of the matrix within the nest matrix
1094629881c0SJed Brown -   jdxm - index of the matrix within the nest matrix
1095d8588912SDave May 
1096d8588912SDave May  Output Parameter:
1097d8588912SDave May .   sub - matrix at index idxm,jdxm within the nest matrix
1098d8588912SDave May 
1099d8588912SDave May  Level: developer
1100d8588912SDave May 
1101bb97c47cSPierre Jolivet .seealso: MatNestGetSize(), MatNestGetSubMats(), MatCreateNest(), MATNEST, MatNestSetSubMat(),
110279798668SBarry Smith           MatNestGetLocalISs(), MatNestGetISs()
1103d8588912SDave May @*/
11047087cfbeSBarry Smith PetscErrorCode  MatNestGetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat *sub)
1105d8588912SDave May {
1106d8588912SDave May   PetscFunctionBegin;
11075f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscUseMethod(A,"MatNestGetSubMat_C",(Mat,PetscInt,PetscInt,Mat*),(A,idxm,jdxm,sub)));
1108d8588912SDave May   PetscFunctionReturn(0);
1109d8588912SDave May }
1110d8588912SDave May 
11110782ca92SJed Brown PetscErrorCode MatNestSetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat mat)
11120782ca92SJed Brown {
11130782ca92SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
11140782ca92SJed Brown   PetscInt       m,n,M,N,mi,ni,Mi,Ni;
11150782ca92SJed Brown 
11160782ca92SJed Brown   PetscFunctionBegin;
11172c71b3e2SJacob Faibussowitsch   PetscCheckFalse(idxm >= bA->nr,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT,idxm,bA->nr-1);
11182c71b3e2SJacob Faibussowitsch   PetscCheckFalse(jdxm >= bA->nc,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %" PetscInt_FMT " max %" PetscInt_FMT,jdxm,bA->nc-1);
11195f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetLocalSize(mat,&m,&n));
11205f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetSize(mat,&M,&N));
11215f80ce2aSJacob Faibussowitsch   CHKERRQ(ISGetLocalSize(bA->isglobal.row[idxm],&mi));
11225f80ce2aSJacob Faibussowitsch   CHKERRQ(ISGetSize(bA->isglobal.row[idxm],&Mi));
11235f80ce2aSJacob Faibussowitsch   CHKERRQ(ISGetLocalSize(bA->isglobal.col[jdxm],&ni));
11245f80ce2aSJacob Faibussowitsch   CHKERRQ(ISGetSize(bA->isglobal.col[jdxm],&Ni));
11252c71b3e2SJacob Faibussowitsch   PetscCheckFalse(M != Mi || N != Ni,PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix dimension (%" PetscInt_FMT ",%" PetscInt_FMT ") incompatible with nest block (%" PetscInt_FMT ",%" PetscInt_FMT ")",M,N,Mi,Ni);
11262c71b3e2SJacob Faibussowitsch   PetscCheckFalse(m != mi || n != ni,PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix local dimension (%" PetscInt_FMT ",%" PetscInt_FMT ") incompatible with nest block (%" PetscInt_FMT ",%" PetscInt_FMT ")",m,n,mi,ni);
112726fbe8dcSKarl Rupp 
112806a1af2fSStefano Zampini   /* do not increase object state */
112906a1af2fSStefano Zampini   if (mat == bA->m[idxm][jdxm]) PetscFunctionReturn(0);
113006a1af2fSStefano Zampini 
11315f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectReference((PetscObject)mat));
11325f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDestroy(&bA->m[idxm][jdxm]));
11330782ca92SJed Brown   bA->m[idxm][jdxm] = mat;
11345f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectStateIncrease((PetscObject)A));
11355f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetNonzeroState(mat,&bA->nnzstate[idxm*bA->nc+jdxm]));
113606a1af2fSStefano Zampini   A->nonzerostate++;
11370782ca92SJed Brown   PetscFunctionReturn(0);
11380782ca92SJed Brown }
11390782ca92SJed Brown 
11409ba0d327SJed Brown /*@
11410782ca92SJed Brown  MatNestSetSubMat - Set a single submatrix in the nest matrix.
11420782ca92SJed Brown 
11430782ca92SJed Brown  Logically collective on the submatrix communicator
11440782ca92SJed Brown 
11450782ca92SJed Brown  Input Parameters:
11460782ca92SJed Brown +   A  - nest matrix
11470782ca92SJed Brown .   idxm - index of the matrix within the nest matrix
11480782ca92SJed Brown .   jdxm - index of the matrix within the nest matrix
11490782ca92SJed Brown -   sub - matrix at index idxm,jdxm within the nest matrix
11500782ca92SJed Brown 
11510782ca92SJed Brown  Notes:
11520782ca92SJed Brown  The new submatrix must have the same size and communicator as that block of the nest.
11530782ca92SJed Brown 
11540782ca92SJed Brown  This increments the reference count of the submatrix.
11550782ca92SJed Brown 
11560782ca92SJed Brown  Level: developer
11570782ca92SJed Brown 
1158bb97c47cSPierre Jolivet .seealso: MatNestSetSubMats(), MatNestGetSubMats(), MatNestGetLocalISs(), MATNEST, MatCreateNest(),
115979798668SBarry Smith           MatNestGetSubMat(), MatNestGetISs(), MatNestGetSize()
11600782ca92SJed Brown @*/
11610782ca92SJed Brown PetscErrorCode  MatNestSetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat sub)
11620782ca92SJed Brown {
11630782ca92SJed Brown   PetscFunctionBegin;
11645f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscUseMethod(A,"MatNestSetSubMat_C",(Mat,PetscInt,PetscInt,Mat),(A,idxm,jdxm,sub)));
11650782ca92SJed Brown   PetscFunctionReturn(0);
11660782ca92SJed Brown }
11670782ca92SJed Brown 
1168d8588912SDave May PetscErrorCode MatNestGetSubMats_Nest(Mat A,PetscInt *M,PetscInt *N,Mat ***mat)
1169d8588912SDave May {
1170d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
11715fd66863SKarl Rupp 
1172d8588912SDave May   PetscFunctionBegin;
117326fbe8dcSKarl Rupp   if (M)   *M   = bA->nr;
117426fbe8dcSKarl Rupp   if (N)   *N   = bA->nc;
117526fbe8dcSKarl Rupp   if (mat) *mat = bA->m;
1176d8588912SDave May   PetscFunctionReturn(0);
1177d8588912SDave May }
1178d8588912SDave May 
1179d8588912SDave May /*@C
1180d8588912SDave May  MatNestGetSubMats - Returns the entire two dimensional array of matrices defining a nest matrix.
1181d8588912SDave May 
1182d8588912SDave May  Not collective
1183d8588912SDave May 
1184f899ff85SJose E. Roman  Input Parameter:
1185629881c0SJed Brown .   A  - nest matrix
1186d8588912SDave May 
1187d8d19677SJose E. Roman  Output Parameters:
1188629881c0SJed Brown +   M - number of rows in the nest matrix
1189d8588912SDave May .   N - number of cols in the nest matrix
1190629881c0SJed Brown -   mat - 2d array of matrices
1191d8588912SDave May 
1192d8588912SDave May  Notes:
1193d8588912SDave May 
1194d8588912SDave May  The user should not free the array mat.
1195d8588912SDave May 
1196351962e3SVincent Le Chenadec  In Fortran, this routine has a calling sequence
1197351962e3SVincent Le Chenadec $   call MatNestGetSubMats(A, M, N, mat, ierr)
1198351962e3SVincent Le Chenadec  where the space allocated for the optional argument mat is assumed large enough (if provided).
1199351962e3SVincent Le Chenadec 
1200d8588912SDave May  Level: developer
1201d8588912SDave May 
1202bb97c47cSPierre Jolivet .seealso: MatNestGetSize(), MatNestGetSubMat(), MatNestGetLocalISs(), MATNEST, MatCreateNest(),
120379798668SBarry Smith           MatNestSetSubMats(), MatNestGetISs(), MatNestSetSubMat()
1204d8588912SDave May @*/
12057087cfbeSBarry Smith PetscErrorCode  MatNestGetSubMats(Mat A,PetscInt *M,PetscInt *N,Mat ***mat)
1206d8588912SDave May {
1207d8588912SDave May   PetscFunctionBegin;
12085f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscUseMethod(A,"MatNestGetSubMats_C",(Mat,PetscInt*,PetscInt*,Mat***),(A,M,N,mat)));
1209d8588912SDave May   PetscFunctionReturn(0);
1210d8588912SDave May }
1211d8588912SDave May 
12127087cfbeSBarry Smith PetscErrorCode  MatNestGetSize_Nest(Mat A,PetscInt *M,PetscInt *N)
1213d8588912SDave May {
1214d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
1215d8588912SDave May 
1216d8588912SDave May   PetscFunctionBegin;
121726fbe8dcSKarl Rupp   if (M) *M = bA->nr;
121826fbe8dcSKarl Rupp   if (N) *N = bA->nc;
1219d8588912SDave May   PetscFunctionReturn(0);
1220d8588912SDave May }
1221d8588912SDave May 
12229ba0d327SJed Brown /*@
1223d8588912SDave May  MatNestGetSize - Returns the size of the nest matrix.
1224d8588912SDave May 
1225d8588912SDave May  Not collective
1226d8588912SDave May 
1227f899ff85SJose E. Roman  Input Parameter:
1228d8588912SDave May .   A  - nest matrix
1229d8588912SDave May 
1230d8d19677SJose E. Roman  Output Parameters:
1231629881c0SJed Brown +   M - number of rows in the nested mat
1232629881c0SJed Brown -   N - number of cols in the nested mat
1233d8588912SDave May 
1234d8588912SDave May  Notes:
1235d8588912SDave May 
1236d8588912SDave May  Level: developer
1237d8588912SDave May 
1238bb97c47cSPierre Jolivet .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MATNEST, MatCreateNest(), MatNestGetLocalISs(),
123979798668SBarry Smith           MatNestGetISs()
1240d8588912SDave May @*/
12417087cfbeSBarry Smith PetscErrorCode  MatNestGetSize(Mat A,PetscInt *M,PetscInt *N)
1242d8588912SDave May {
1243d8588912SDave May   PetscFunctionBegin;
12445f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscUseMethod(A,"MatNestGetSize_C",(Mat,PetscInt*,PetscInt*),(A,M,N)));
1245d8588912SDave May   PetscFunctionReturn(0);
1246d8588912SDave May }
1247d8588912SDave May 
1248f7a08781SBarry Smith static PetscErrorCode MatNestGetISs_Nest(Mat A,IS rows[],IS cols[])
1249900e7ff2SJed Brown {
1250900e7ff2SJed Brown   Mat_Nest *vs = (Mat_Nest*)A->data;
1251900e7ff2SJed Brown   PetscInt i;
1252900e7ff2SJed Brown 
1253900e7ff2SJed Brown   PetscFunctionBegin;
1254900e7ff2SJed Brown   if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->isglobal.row[i];
1255900e7ff2SJed Brown   if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->isglobal.col[i];
1256900e7ff2SJed Brown   PetscFunctionReturn(0);
1257900e7ff2SJed Brown }
1258900e7ff2SJed Brown 
/*@C
 MatNestGetISs - Returns the global index sets partitioning the row and column spaces

 Not collective

 Input Parameter:
.   A  - nest matrix

 Output Parameters:
+   rows - array of row index sets (or NULL to ignore)
-   cols - array of column index sets (or NULL to ignore)

 Level: advanced

 Notes:
 The user must have allocated arrays of the correct size: one entry per nested row block for rows and
 one entry per nested column block for cols, see MatNestGetSize(). The reference count is not increased
 on the returned ISs.

.seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetLocalISs(), MATNEST,
          MatCreateNest(), MatNestGetSubMats(), MatNestSetSubMats()
@*/
PetscErrorCode  MatNestGetISs(Mat A,IS rows[],IS cols[])
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(A,MAT_CLASSID,1);
  CHKERRQ(PetscUseMethod(A,"MatNestGetISs_C",(Mat,IS[],IS[]),(A,rows,cols)));
  PetscFunctionReturn(0);
}
1286900e7ff2SJed Brown 
1287f7a08781SBarry Smith static PetscErrorCode MatNestGetLocalISs_Nest(Mat A,IS rows[],IS cols[])
1288900e7ff2SJed Brown {
1289900e7ff2SJed Brown   Mat_Nest *vs = (Mat_Nest*)A->data;
1290900e7ff2SJed Brown   PetscInt i;
1291900e7ff2SJed Brown 
1292900e7ff2SJed Brown   PetscFunctionBegin;
1293900e7ff2SJed Brown   if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->islocal.row[i];
1294900e7ff2SJed Brown   if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->islocal.col[i];
1295900e7ff2SJed Brown   PetscFunctionReturn(0);
1296900e7ff2SJed Brown }
1297900e7ff2SJed Brown 
/*@C
 MatNestGetLocalISs - Returns the local index sets partitioning the row and column spaces

 Not collective

 Input Parameter:
.   A  - nest matrix

 Output Parameters:
+   rows - array of row index sets (or NULL to ignore)
-   cols - array of column index sets (or NULL to ignore)

 Level: advanced

 Notes:
 The user must have allocated arrays of the correct size: one entry per nested row block for rows and
 one entry per nested column block for cols, see MatNestGetSize(). The reference count is not increased
 on the returned ISs.

 Use MatNestGetISs() to obtain the global index sets instead.

.seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetISs(), MatCreateNest(),
          MATNEST, MatNestSetSubMats(), MatNestSetSubMat()
@*/
PetscErrorCode  MatNestGetLocalISs(Mat A,IS rows[],IS cols[])
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(A,MAT_CLASSID,1);
  CHKERRQ(PetscUseMethod(A,"MatNestGetLocalISs_C",(Mat,IS[],IS[]),(A,rows,cols)));
  PetscFunctionReturn(0);
}
1325900e7ff2SJed Brown 
132619fd82e9SBarry Smith PetscErrorCode  MatNestSetVecType_Nest(Mat A,VecType vtype)
1327207556f9SJed Brown {
1328207556f9SJed Brown   PetscBool      flg;
1329207556f9SJed Brown 
1330207556f9SJed Brown   PetscFunctionBegin;
13315f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscStrcmp(vtype,VECNEST,&flg));
1332207556f9SJed Brown   /* In reality, this only distinguishes VECNEST and "other" */
13332a7a6963SBarry Smith   if (flg) A->ops->getvecs = MatCreateVecs_Nest;
133412b53f24SSatish Balay   else A->ops->getvecs = (PetscErrorCode (*)(Mat,Vec*,Vec*)) 0;
1335207556f9SJed Brown   PetscFunctionReturn(0);
1336207556f9SJed Brown }
1337207556f9SJed Brown 
1338207556f9SJed Brown /*@C
13392a7a6963SBarry Smith  MatNestSetVecType - Sets the type of Vec returned by MatCreateVecs()
1340207556f9SJed Brown 
1341207556f9SJed Brown  Not collective
1342207556f9SJed Brown 
1343207556f9SJed Brown  Input Parameters:
1344207556f9SJed Brown +  A  - nest matrix
1345207556f9SJed Brown -  vtype - type to use for creating vectors
1346207556f9SJed Brown 
1347207556f9SJed Brown  Notes:
1348207556f9SJed Brown 
1349207556f9SJed Brown  Level: developer
1350207556f9SJed Brown 
1351bb97c47cSPierre Jolivet .seealso: MatCreateVecs(), MATNEST, MatCreateNest()
1352207556f9SJed Brown @*/
135319fd82e9SBarry Smith PetscErrorCode  MatNestSetVecType(Mat A,VecType vtype)
1354207556f9SJed Brown {
1355207556f9SJed Brown   PetscFunctionBegin;
13565f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscTryMethod(A,"MatNestSetVecType_C",(Mat,VecType),(A,vtype)));
1357207556f9SJed Brown   PetscFunctionReturn(0);
1358207556f9SJed Brown }
1359207556f9SJed Brown 
1360c8883902SJed Brown PetscErrorCode MatNestSetSubMats_Nest(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[])
1361d8588912SDave May {
1362c8883902SJed Brown   Mat_Nest       *s = (Mat_Nest*)A->data;
1363c8883902SJed Brown   PetscInt       i,j,m,n,M,N;
136488ffe2e8SJose E. Roman   PetscBool      cong,isstd,sametype=PETSC_FALSE;
136588ffe2e8SJose E. Roman   VecType        vtype,type;
1366d8588912SDave May 
1367d8588912SDave May   PetscFunctionBegin;
13685f80ce2aSJacob Faibussowitsch   CHKERRQ(MatReset_Nest(A));
136906a1af2fSStefano Zampini 
1370c8883902SJed Brown   s->nr = nr;
1371c8883902SJed Brown   s->nc = nc;
1372d8588912SDave May 
1373c8883902SJed Brown   /* Create space for submatrices */
13745f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMalloc1(nr,&s->m));
1375c8883902SJed Brown   for (i=0; i<nr; i++) {
13765f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscMalloc1(nc,&s->m[i]));
1377d8588912SDave May   }
1378c8883902SJed Brown   for (i=0; i<nr; i++) {
1379c8883902SJed Brown     for (j=0; j<nc; j++) {
1380c8883902SJed Brown       s->m[i][j] = a[i*nc+j];
1381c8883902SJed Brown       if (a[i*nc+j]) {
13825f80ce2aSJacob Faibussowitsch         CHKERRQ(PetscObjectReference((PetscObject)a[i*nc+j]));
1383d8588912SDave May       }
1384d8588912SDave May     }
1385d8588912SDave May   }
13865f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetVecType(A,&vtype));
13875f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscStrcmp(vtype,VECSTANDARD,&isstd));
138888ffe2e8SJose E. Roman   if (isstd) {
138988ffe2e8SJose E. Roman     /* check if all blocks have the same vectype */
139088ffe2e8SJose E. Roman     vtype = NULL;
139188ffe2e8SJose E. Roman     for (i=0; i<nr; i++) {
139288ffe2e8SJose E. Roman       for (j=0; j<nc; j++) {
139388ffe2e8SJose E. Roman         if (a[i*nc+j]) {
139488ffe2e8SJose E. Roman           if (!vtype) {  /* first visited block */
13955f80ce2aSJacob Faibussowitsch             CHKERRQ(MatGetVecType(a[i*nc+j],&vtype));
139688ffe2e8SJose E. Roman             sametype = PETSC_TRUE;
139788ffe2e8SJose E. Roman           } else if (sametype) {
13985f80ce2aSJacob Faibussowitsch             CHKERRQ(MatGetVecType(a[i*nc+j],&type));
13995f80ce2aSJacob Faibussowitsch             CHKERRQ(PetscStrcmp(vtype,type,&sametype));
140088ffe2e8SJose E. Roman           }
140188ffe2e8SJose E. Roman         }
140288ffe2e8SJose E. Roman       }
140388ffe2e8SJose E. Roman     }
140488ffe2e8SJose E. Roman     if (sametype) {  /* propagate vectype */
14055f80ce2aSJacob Faibussowitsch       CHKERRQ(MatSetVecType(A,vtype));
140688ffe2e8SJose E. Roman     }
140788ffe2e8SJose E. Roman   }
1408d8588912SDave May 
14095f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSetUp_NestIS_Private(A,nr,is_row,nc,is_col));
1410d8588912SDave May 
14115f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMalloc1(nr,&s->row_len));
14125f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMalloc1(nc,&s->col_len));
1413c8883902SJed Brown   for (i=0; i<nr; i++) s->row_len[i]=-1;
1414c8883902SJed Brown   for (j=0; j<nc; j++) s->col_len[j]=-1;
1415d8588912SDave May 
14165f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscCalloc1(nr*nc,&s->nnzstate));
141706a1af2fSStefano Zampini   for (i=0; i<nr; i++) {
141806a1af2fSStefano Zampini     for (j=0; j<nc; j++) {
141906a1af2fSStefano Zampini       if (s->m[i][j]) {
14205f80ce2aSJacob Faibussowitsch         CHKERRQ(MatGetNonzeroState(s->m[i][j],&s->nnzstate[i*nc+j]));
142106a1af2fSStefano Zampini       }
142206a1af2fSStefano Zampini     }
142306a1af2fSStefano Zampini   }
142406a1af2fSStefano Zampini 
14255f80ce2aSJacob Faibussowitsch   CHKERRQ(MatNestGetSizes_Private(A,&m,&n,&M,&N));
1426d8588912SDave May 
14275f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscLayoutSetSize(A->rmap,M));
14285f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscLayoutSetLocalSize(A->rmap,m));
14295f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscLayoutSetSize(A->cmap,N));
14305f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscLayoutSetLocalSize(A->cmap,n));
1431c8883902SJed Brown 
14325f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscLayoutSetUp(A->rmap));
14335f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscLayoutSetUp(A->cmap));
1434c8883902SJed Brown 
143506a1af2fSStefano Zampini   /* disable operations that are not supported for non-square matrices,
143606a1af2fSStefano Zampini      or matrices for which is_row != is_col  */
14375f80ce2aSJacob Faibussowitsch   CHKERRQ(MatHasCongruentLayouts(A,&cong));
143806a1af2fSStefano Zampini   if (cong && nr != nc) cong = PETSC_FALSE;
143906a1af2fSStefano Zampini   if (cong) {
144006a1af2fSStefano Zampini     for (i = 0; cong && i < nr; i++) {
14415f80ce2aSJacob Faibussowitsch       CHKERRQ(ISEqualUnsorted(s->isglobal.row[i],s->isglobal.col[i],&cong));
144206a1af2fSStefano Zampini     }
144306a1af2fSStefano Zampini   }
144406a1af2fSStefano Zampini   if (!cong) {
1445381b8e50SStefano Zampini     A->ops->missingdiagonal = NULL;
144606a1af2fSStefano Zampini     A->ops->getdiagonal     = NULL;
144706a1af2fSStefano Zampini     A->ops->shift           = NULL;
144806a1af2fSStefano Zampini     A->ops->diagonalset     = NULL;
144906a1af2fSStefano Zampini   }
145006a1af2fSStefano Zampini 
14515f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscCalloc2(nr,&s->left,nc,&s->right));
14525f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectStateIncrease((PetscObject)A));
145306a1af2fSStefano Zampini   A->nonzerostate++;
1454d8588912SDave May   PetscFunctionReturn(0);
1455d8588912SDave May }
1456d8588912SDave May 
1457c8883902SJed Brown /*@
1458c8883902SJed Brown    MatNestSetSubMats - Sets the nested submatrices
1459c8883902SJed Brown 
1460c8883902SJed Brown    Collective on Mat
1461c8883902SJed Brown 
1462d8d19677SJose E. Roman    Input Parameters:
1463ffd6319bSRichard Tran Mills +  A - nested matrix
1464c8883902SJed Brown .  nr - number of nested row blocks
14650298fd71SBarry Smith .  is_row - index sets for each nested row block, or NULL to make contiguous
1466c8883902SJed Brown .  nc - number of nested column blocks
14670298fd71SBarry Smith .  is_col - index sets for each nested column block, or NULL to make contiguous
14680298fd71SBarry Smith -  a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL
1469c8883902SJed Brown 
147006a1af2fSStefano Zampini    Notes: this always resets any submatrix information previously set
147106a1af2fSStefano Zampini 
1472c8883902SJed Brown    Level: advanced
1473c8883902SJed Brown 
147479798668SBarry Smith .seealso: MatCreateNest(), MATNEST, MatNestSetSubMat(), MatNestGetSubMat(), MatNestGetSubMats()
1475c8883902SJed Brown @*/
1476c8883902SJed Brown PetscErrorCode MatNestSetSubMats(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[])
1477c8883902SJed Brown {
147806a1af2fSStefano Zampini   PetscInt       i;
1479c8883902SJed Brown 
1480c8883902SJed Brown   PetscFunctionBegin;
1481c8883902SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
14822c71b3e2SJacob Faibussowitsch   PetscCheckFalse(nr < 0,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of rows cannot be negative");
1483c8883902SJed Brown   if (nr && is_row) {
1484c8883902SJed Brown     PetscValidPointer(is_row,3);
1485c8883902SJed Brown     for (i=0; i<nr; i++) PetscValidHeaderSpecific(is_row[i],IS_CLASSID,3);
1486c8883902SJed Brown   }
14872c71b3e2SJacob Faibussowitsch   PetscCheckFalse(nc < 0,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of columns cannot be negative");
14881664e352SJed Brown   if (nc && is_col) {
1489c8883902SJed Brown     PetscValidPointer(is_col,5);
14909b30a8f6SBarry Smith     for (i=0; i<nc; i++) PetscValidHeaderSpecific(is_col[i],IS_CLASSID,5);
1491c8883902SJed Brown   }
149206a1af2fSStefano Zampini   if (nr*nc > 0) PetscValidPointer(a,6);
14935f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscUseMethod(A,"MatNestSetSubMats_C",(Mat,PetscInt,const IS[],PetscInt,const IS[],const Mat[]),(A,nr,is_row,nc,is_col,a)));
1494c8883902SJed Brown   PetscFunctionReturn(0);
1495c8883902SJed Brown }
1496d8588912SDave May 
149745b6f7e9SBarry Smith static PetscErrorCode MatNestCreateAggregateL2G_Private(Mat A,PetscInt n,const IS islocal[],const IS isglobal[],PetscBool colflg,ISLocalToGlobalMapping *ltog)
149877019fcaSJed Brown {
149977019fcaSJed Brown   PetscBool      flg;
150077019fcaSJed Brown   PetscInt       i,j,m,mi,*ix;
150177019fcaSJed Brown 
150277019fcaSJed Brown   PetscFunctionBegin;
1503aea6d515SStefano Zampini   *ltog = NULL;
150477019fcaSJed Brown   for (i=0,m=0,flg=PETSC_FALSE; i<n; i++) {
150577019fcaSJed Brown     if (islocal[i]) {
15065f80ce2aSJacob Faibussowitsch       CHKERRQ(ISGetLocalSize(islocal[i],&mi));
150777019fcaSJed Brown       flg  = PETSC_TRUE;      /* We found a non-trivial entry */
150877019fcaSJed Brown     } else {
15095f80ce2aSJacob Faibussowitsch       CHKERRQ(ISGetLocalSize(isglobal[i],&mi));
151077019fcaSJed Brown     }
151177019fcaSJed Brown     m += mi;
151277019fcaSJed Brown   }
1513aea6d515SStefano Zampini   if (!flg) PetscFunctionReturn(0);
1514aea6d515SStefano Zampini 
15155f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMalloc1(m,&ix));
1516165cd838SBarry Smith   for (i=0,m=0; i<n; i++) {
15170298fd71SBarry Smith     ISLocalToGlobalMapping smap = NULL;
1518e108cb99SStefano Zampini     Mat                    sub = NULL;
1519f6d38dbbSStefano Zampini     PetscSF                sf;
1520f6d38dbbSStefano Zampini     PetscLayout            map;
1521aea6d515SStefano Zampini     const PetscInt         *ix2;
152277019fcaSJed Brown 
1523165cd838SBarry Smith     if (!colflg) {
15245f80ce2aSJacob Faibussowitsch       CHKERRQ(MatNestFindNonzeroSubMatRow(A,i,&sub));
152577019fcaSJed Brown     } else {
15265f80ce2aSJacob Faibussowitsch       CHKERRQ(MatNestFindNonzeroSubMatCol(A,i,&sub));
152777019fcaSJed Brown     }
1528191fd14bSBarry Smith     if (sub) {
1529191fd14bSBarry Smith       if (!colflg) {
15305f80ce2aSJacob Faibussowitsch         CHKERRQ(MatGetLocalToGlobalMapping(sub,&smap,NULL));
1531191fd14bSBarry Smith       } else {
15325f80ce2aSJacob Faibussowitsch         CHKERRQ(MatGetLocalToGlobalMapping(sub,NULL,&smap));
1533191fd14bSBarry Smith       }
1534191fd14bSBarry Smith     }
153577019fcaSJed Brown     /*
153677019fcaSJed Brown        Now we need to extract the monolithic global indices that correspond to the given split global indices.
153777019fcaSJed Brown        In many/most cases, we only want MatGetLocalSubMatrix() to work, in which case we only need to know the size of the local spaces.
153877019fcaSJed Brown     */
15395f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetIndices(isglobal[i],&ix2));
1540aea6d515SStefano Zampini     if (islocal[i]) {
1541aea6d515SStefano Zampini       PetscInt *ilocal,*iremote;
1542aea6d515SStefano Zampini       PetscInt mil,nleaves;
1543aea6d515SStefano Zampini 
15445f80ce2aSJacob Faibussowitsch       CHKERRQ(ISGetLocalSize(islocal[i],&mi));
1545*28b400f6SJacob Faibussowitsch       PetscCheck(smap,PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"Missing local to global map");
1546aea6d515SStefano Zampini       for (j=0; j<mi; j++) ix[m+j] = j;
15475f80ce2aSJacob Faibussowitsch       CHKERRQ(ISLocalToGlobalMappingApply(smap,mi,ix+m,ix+m));
1548aea6d515SStefano Zampini 
1549aea6d515SStefano Zampini       /* PetscSFSetGraphLayout does not like negative indices */
15505f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscMalloc2(mi,&ilocal,mi,&iremote));
1551aea6d515SStefano Zampini       for (j=0, nleaves = 0; j<mi; j++) {
1552aea6d515SStefano Zampini         if (ix[m+j] < 0) continue;
1553aea6d515SStefano Zampini         ilocal[nleaves]  = j;
1554aea6d515SStefano Zampini         iremote[nleaves] = ix[m+j];
1555aea6d515SStefano Zampini         nleaves++;
1556aea6d515SStefano Zampini       }
15575f80ce2aSJacob Faibussowitsch       CHKERRQ(ISGetLocalSize(isglobal[i],&mil));
15585f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscSFCreate(PetscObjectComm((PetscObject)A),&sf));
15595f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscLayoutCreate(PetscObjectComm((PetscObject)A),&map));
15605f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscLayoutSetLocalSize(map,mil));
15615f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscLayoutSetUp(map));
15625f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscSFSetGraphLayout(sf,map,nleaves,ilocal,PETSC_USE_POINTER,iremote));
15635f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscLayoutDestroy(&map));
15645f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscSFBcastBegin(sf,MPIU_INT,ix2,ix + m,MPI_REPLACE));
15655f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscSFBcastEnd(sf,MPIU_INT,ix2,ix + m,MPI_REPLACE));
15665f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscSFDestroy(&sf));
15675f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscFree2(ilocal,iremote));
1568aea6d515SStefano Zampini     } else {
15695f80ce2aSJacob Faibussowitsch       CHKERRQ(ISGetLocalSize(isglobal[i],&mi));
1570aea6d515SStefano Zampini       for (j=0; j<mi; j++) ix[m+j] = ix2[i];
1571aea6d515SStefano Zampini     }
15725f80ce2aSJacob Faibussowitsch     CHKERRQ(ISRestoreIndices(isglobal[i],&ix2));
157377019fcaSJed Brown     m   += mi;
157477019fcaSJed Brown   }
15755f80ce2aSJacob Faibussowitsch   CHKERRQ(ISLocalToGlobalMappingCreate(PetscObjectComm((PetscObject)A),1,m,ix,PETSC_OWN_POINTER,ltog));
157677019fcaSJed Brown   PetscFunctionReturn(0);
157777019fcaSJed Brown }
157877019fcaSJed Brown 
/* If an IS was provided, there is nothing Nest needs to do, otherwise Nest will build a strided IS */
/*
  nprocessors = NP
  Nest x^T = ((g_0,g_1,...g_NP-1), (h_0,h_1,...h_NP-1))
       proc 0: => (g_0,h_0,)
       proc 1: => (g_1,h_1,)
       ...
       proc NP-1: => (g_NP-1,h_NP-1,)

            proc 0:                      proc 1:                    proc NP-1:
    is[0] = (0,1,2,...,nlocal(g_0)-1)  (0,1,...,nlocal(g_1)-1)  (0,1,...,nlocal(g_NP-1)-1)

            proc 0:
    is[1] = (nlocal(g_0),nlocal(g_0)+1,...,nlocal(g_0)+nlocal(h_0)-1)
            proc 1:
    is[1] = (nlocal(g_1),nlocal(g_1)+1,...,nlocal(g_1)+nlocal(h_1)-1)

            proc NP-1:
    is[1] = (nlocal(g_NP-1),nlocal(g_NP-1)+1,...,nlocal(g_NP-1)+nlocal(h_NP-1)-1)
*/
1599841e96a3SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[])
1600d8588912SDave May {
1601e2d7f03fSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
16028188e55aSJed Brown   PetscInt       i,j,offset,n,nsum,bs;
16030298fd71SBarry Smith   Mat            sub = NULL;
1604d8588912SDave May 
1605d8588912SDave May   PetscFunctionBegin;
16065f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMalloc1(nr,&vs->isglobal.row));
16075f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMalloc1(nc,&vs->isglobal.col));
1608d8588912SDave May   if (is_row) { /* valid IS is passed in */
1609a5b23f4aSJose E. Roman     /* refs on is[] are incremented */
1610e2d7f03fSJed Brown     for (i=0; i<vs->nr; i++) {
16115f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscObjectReference((PetscObject)is_row[i]));
161226fbe8dcSKarl Rupp 
1613e2d7f03fSJed Brown       vs->isglobal.row[i] = is_row[i];
1614d8588912SDave May     }
16152ae74bdbSJed Brown   } else {                      /* Create the ISs by inspecting sizes of a submatrix in each row */
16168188e55aSJed Brown     nsum = 0;
16178188e55aSJed Brown     for (i=0; i<vs->nr; i++) {  /* Add up the local sizes to compute the aggregate offset */
16185f80ce2aSJacob Faibussowitsch       CHKERRQ(MatNestFindNonzeroSubMatRow(A,i,&sub));
1619*28b400f6SJacob Faibussowitsch       PetscCheck(sub,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in row %" PetscInt_FMT,i);
16205f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetLocalSize(sub,&n,NULL));
16212c71b3e2SJacob Faibussowitsch       PetscCheckFalse(n < 0,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix");
16228188e55aSJed Brown       nsum += n;
16238188e55aSJed Brown     }
16245f80ce2aSJacob Faibussowitsch     CHKERRMPI(MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A)));
162530bc264bSJed Brown     offset -= nsum;
1626e2d7f03fSJed Brown     for (i=0; i<vs->nr; i++) {
16275f80ce2aSJacob Faibussowitsch       CHKERRQ(MatNestFindNonzeroSubMatRow(A,i,&sub));
16285f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetLocalSize(sub,&n,NULL));
16295f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetBlockSizes(sub,&bs,NULL));
16305f80ce2aSJacob Faibussowitsch       CHKERRQ(ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.row[i]));
16315f80ce2aSJacob Faibussowitsch       CHKERRQ(ISSetBlockSize(vs->isglobal.row[i],bs));
16322ae74bdbSJed Brown       offset += n;
1633d8588912SDave May     }
1634d8588912SDave May   }
1635d8588912SDave May 
1636d8588912SDave May   if (is_col) { /* valid IS is passed in */
1637a5b23f4aSJose E. Roman     /* refs on is[] are incremented */
1638e2d7f03fSJed Brown     for (j=0; j<vs->nc; j++) {
16395f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscObjectReference((PetscObject)is_col[j]));
164026fbe8dcSKarl Rupp 
1641e2d7f03fSJed Brown       vs->isglobal.col[j] = is_col[j];
1642d8588912SDave May     }
16432ae74bdbSJed Brown   } else {                      /* Create the ISs by inspecting sizes of a submatrix in each column */
16442ae74bdbSJed Brown     offset = A->cmap->rstart;
16458188e55aSJed Brown     nsum   = 0;
16468188e55aSJed Brown     for (j=0; j<vs->nc; j++) {
16475f80ce2aSJacob Faibussowitsch       CHKERRQ(MatNestFindNonzeroSubMatCol(A,j,&sub));
1648*28b400f6SJacob Faibussowitsch       PetscCheck(sub,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in column %" PetscInt_FMT,i);
16495f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetLocalSize(sub,NULL,&n));
16502c71b3e2SJacob Faibussowitsch       PetscCheckFalse(n < 0,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix");
16518188e55aSJed Brown       nsum += n;
16528188e55aSJed Brown     }
16535f80ce2aSJacob Faibussowitsch     CHKERRMPI(MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A)));
165430bc264bSJed Brown     offset -= nsum;
1655e2d7f03fSJed Brown     for (j=0; j<vs->nc; j++) {
16565f80ce2aSJacob Faibussowitsch       CHKERRQ(MatNestFindNonzeroSubMatCol(A,j,&sub));
16575f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetLocalSize(sub,NULL,&n));
16585f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetBlockSizes(sub,NULL,&bs));
16595f80ce2aSJacob Faibussowitsch       CHKERRQ(ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.col[j]));
16605f80ce2aSJacob Faibussowitsch       CHKERRQ(ISSetBlockSize(vs->isglobal.col[j],bs));
16612ae74bdbSJed Brown       offset += n;
1662d8588912SDave May     }
1663d8588912SDave May   }
1664e2d7f03fSJed Brown 
1665e2d7f03fSJed Brown   /* Set up the local ISs */
16665f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMalloc1(vs->nr,&vs->islocal.row));
16675f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMalloc1(vs->nc,&vs->islocal.col));
1668e2d7f03fSJed Brown   for (i=0,offset=0; i<vs->nr; i++) {
1669e2d7f03fSJed Brown     IS                     isloc;
16700298fd71SBarry Smith     ISLocalToGlobalMapping rmap = NULL;
1671e2d7f03fSJed Brown     PetscInt               nlocal,bs;
16725f80ce2aSJacob Faibussowitsch     CHKERRQ(MatNestFindNonzeroSubMatRow(A,i,&sub));
16735f80ce2aSJacob Faibussowitsch     if (sub) CHKERRQ(MatGetLocalToGlobalMapping(sub,&rmap,NULL));
1674207556f9SJed Brown     if (rmap) {
16755f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetBlockSizes(sub,&bs,NULL));
16765f80ce2aSJacob Faibussowitsch       CHKERRQ(ISLocalToGlobalMappingGetSize(rmap,&nlocal));
16775f80ce2aSJacob Faibussowitsch       CHKERRQ(ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc));
16785f80ce2aSJacob Faibussowitsch       CHKERRQ(ISSetBlockSize(isloc,bs));
1679207556f9SJed Brown     } else {
1680207556f9SJed Brown       nlocal = 0;
16810298fd71SBarry Smith       isloc  = NULL;
1682207556f9SJed Brown     }
1683e2d7f03fSJed Brown     vs->islocal.row[i] = isloc;
1684e2d7f03fSJed Brown     offset            += nlocal;
1685e2d7f03fSJed Brown   }
16868188e55aSJed Brown   for (i=0,offset=0; i<vs->nc; i++) {
1687e2d7f03fSJed Brown     IS                     isloc;
16880298fd71SBarry Smith     ISLocalToGlobalMapping cmap = NULL;
1689e2d7f03fSJed Brown     PetscInt               nlocal,bs;
16905f80ce2aSJacob Faibussowitsch     CHKERRQ(MatNestFindNonzeroSubMatCol(A,i,&sub));
16915f80ce2aSJacob Faibussowitsch     if (sub) CHKERRQ(MatGetLocalToGlobalMapping(sub,NULL,&cmap));
1692207556f9SJed Brown     if (cmap) {
16935f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetBlockSizes(sub,NULL,&bs));
16945f80ce2aSJacob Faibussowitsch       CHKERRQ(ISLocalToGlobalMappingGetSize(cmap,&nlocal));
16955f80ce2aSJacob Faibussowitsch       CHKERRQ(ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc));
16965f80ce2aSJacob Faibussowitsch       CHKERRQ(ISSetBlockSize(isloc,bs));
1697207556f9SJed Brown     } else {
1698207556f9SJed Brown       nlocal = 0;
16990298fd71SBarry Smith       isloc  = NULL;
1700207556f9SJed Brown     }
1701e2d7f03fSJed Brown     vs->islocal.col[i] = isloc;
1702e2d7f03fSJed Brown     offset            += nlocal;
1703e2d7f03fSJed Brown   }
17040189643fSJed Brown 
170577019fcaSJed Brown   /* Set up the aggregate ISLocalToGlobalMapping */
170677019fcaSJed Brown   {
170745b6f7e9SBarry Smith     ISLocalToGlobalMapping rmap,cmap;
17085f80ce2aSJacob Faibussowitsch     CHKERRQ(MatNestCreateAggregateL2G_Private(A,vs->nr,vs->islocal.row,vs->isglobal.row,PETSC_FALSE,&rmap));
17095f80ce2aSJacob Faibussowitsch     CHKERRQ(MatNestCreateAggregateL2G_Private(A,vs->nc,vs->islocal.col,vs->isglobal.col,PETSC_TRUE,&cmap));
17105f80ce2aSJacob Faibussowitsch     if (rmap && cmap) CHKERRQ(MatSetLocalToGlobalMapping(A,rmap,cmap));
17115f80ce2aSJacob Faibussowitsch     CHKERRQ(ISLocalToGlobalMappingDestroy(&rmap));
17125f80ce2aSJacob Faibussowitsch     CHKERRQ(ISLocalToGlobalMappingDestroy(&cmap));
171377019fcaSJed Brown   }
171477019fcaSJed Brown 
171576bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
17160189643fSJed Brown     for (i=0; i<vs->nr; i++) {
17170189643fSJed Brown       for (j=0; j<vs->nc; j++) {
17180189643fSJed Brown         PetscInt m,n,M,N,mi,ni,Mi,Ni;
17190189643fSJed Brown         Mat      B = vs->m[i][j];
17200189643fSJed Brown         if (!B) continue;
17215f80ce2aSJacob Faibussowitsch         CHKERRQ(MatGetSize(B,&M,&N));
17225f80ce2aSJacob Faibussowitsch         CHKERRQ(MatGetLocalSize(B,&m,&n));
17235f80ce2aSJacob Faibussowitsch         CHKERRQ(ISGetSize(vs->isglobal.row[i],&Mi));
17245f80ce2aSJacob Faibussowitsch         CHKERRQ(ISGetSize(vs->isglobal.col[j],&Ni));
17255f80ce2aSJacob Faibussowitsch         CHKERRQ(ISGetLocalSize(vs->isglobal.row[i],&mi));
17265f80ce2aSJacob Faibussowitsch         CHKERRQ(ISGetLocalSize(vs->isglobal.col[j],&ni));
17272c71b3e2SJacob Faibussowitsch         PetscCheckFalse(M != Mi || N != Ni,PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Global sizes (%" PetscInt_FMT ",%" PetscInt_FMT ") of nested submatrix (%" PetscInt_FMT ",%" PetscInt_FMT ") do not agree with space defined by index sets (%" PetscInt_FMT ",%" PetscInt_FMT ")",M,N,i,j,Mi,Ni);
17282c71b3e2SJacob Faibussowitsch         PetscCheckFalse(m != mi || n != ni,PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Local sizes (%" PetscInt_FMT ",%" PetscInt_FMT ") of nested submatrix (%" PetscInt_FMT ",%" PetscInt_FMT ") do not agree with space defined by index sets (%" PetscInt_FMT ",%" PetscInt_FMT ")",m,n,i,j,mi,ni);
17290189643fSJed Brown       }
17300189643fSJed Brown     }
173176bd3646SJed Brown   }
1732a061e289SJed Brown 
1733a061e289SJed Brown   /* Set A->assembled if all non-null blocks are currently assembled */
1734a061e289SJed Brown   for (i=0; i<vs->nr; i++) {
1735a061e289SJed Brown     for (j=0; j<vs->nc; j++) {
1736a061e289SJed Brown       if (vs->m[i][j] && !vs->m[i][j]->assembled) PetscFunctionReturn(0);
1737a061e289SJed Brown     }
1738a061e289SJed Brown   }
1739a061e289SJed Brown   A->assembled = PETSC_TRUE;
1740d8588912SDave May   PetscFunctionReturn(0);
1741d8588912SDave May }
1742d8588912SDave May 
174345c38901SJed Brown /*@C
1744659c6bb0SJed Brown    MatCreateNest - Creates a new matrix containing several nested submatrices, each stored separately
1745659c6bb0SJed Brown 
1746659c6bb0SJed Brown    Collective on Mat
1747659c6bb0SJed Brown 
1748d8d19677SJose E. Roman    Input Parameters:
1749659c6bb0SJed Brown +  comm - Communicator for the new Mat
1750659c6bb0SJed Brown .  nr - number of nested row blocks
17510298fd71SBarry Smith .  is_row - index sets for each nested row block, or NULL to make contiguous
1752659c6bb0SJed Brown .  nc - number of nested column blocks
17530298fd71SBarry Smith .  is_col - index sets for each nested column block, or NULL to make contiguous
17540298fd71SBarry Smith -  a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL
1755659c6bb0SJed Brown 
1756659c6bb0SJed Brown    Output Parameter:
1757659c6bb0SJed Brown .  B - new matrix
1758659c6bb0SJed Brown 
1759659c6bb0SJed Brown    Level: advanced
1760659c6bb0SJed Brown 
176179798668SBarry Smith .seealso: MatCreate(), VecCreateNest(), DMCreateMatrix(), MATNEST, MatNestSetSubMat(),
176279798668SBarry Smith           MatNestGetSubMat(), MatNestGetLocalISs(), MatNestGetSize(),
176379798668SBarry Smith           MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats()
1764659c6bb0SJed Brown @*/
17657087cfbeSBarry Smith PetscErrorCode MatCreateNest(MPI_Comm comm,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[],Mat *B)
1766d8588912SDave May {
1767d8588912SDave May   Mat            A;
1768d8588912SDave May 
1769d8588912SDave May   PetscFunctionBegin;
1770f4259b30SLisandro Dalcin   *B   = NULL;
17715f80ce2aSJacob Faibussowitsch   CHKERRQ(MatCreate(comm,&A));
17725f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSetType(A,MATNEST));
177391a28eb3SBarry Smith   A->preallocated = PETSC_TRUE;
17745f80ce2aSJacob Faibussowitsch   CHKERRQ(MatNestSetSubMats(A,nr,is_row,nc,is_col,a));
1775d8588912SDave May   *B   = A;
1776d8588912SDave May   PetscFunctionReturn(0);
1777d8588912SDave May }
1778659c6bb0SJed Brown 
1779be705e3aSPierre Jolivet PetscErrorCode MatConvert_Nest_SeqAIJ_fast(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
1780b68353e5Sstefano_zampini {
1781b68353e5Sstefano_zampini   Mat_Nest       *nest = (Mat_Nest*)A->data;
178223875855Sstefano_zampini   Mat            *trans;
1783b68353e5Sstefano_zampini   PetscScalar    **avv;
1784b68353e5Sstefano_zampini   PetscScalar    *vv;
1785b68353e5Sstefano_zampini   PetscInt       **aii,**ajj;
1786b68353e5Sstefano_zampini   PetscInt       *ii,*jj,*ci;
1787b68353e5Sstefano_zampini   PetscInt       nr,nc,nnz,i,j;
1788b68353e5Sstefano_zampini   PetscBool      done;
1789b68353e5Sstefano_zampini 
1790b68353e5Sstefano_zampini   PetscFunctionBegin;
17915f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetSize(A,&nr,&nc));
1792b68353e5Sstefano_zampini   if (reuse == MAT_REUSE_MATRIX) {
1793b68353e5Sstefano_zampini     PetscInt rnr;
1794b68353e5Sstefano_zampini 
17955f80ce2aSJacob Faibussowitsch     CHKERRQ(MatGetRowIJ(*newmat,0,PETSC_FALSE,PETSC_FALSE,&rnr,(const PetscInt**)&ii,(const PetscInt**)&jj,&done));
1796*28b400f6SJacob Faibussowitsch     PetscCheck(done,PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"MatGetRowIJ");
17972c71b3e2SJacob Faibussowitsch     PetscCheckFalse(rnr != nr,PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of rows");
17985f80ce2aSJacob Faibussowitsch     CHKERRQ(MatSeqAIJGetArray(*newmat,&vv));
1799b68353e5Sstefano_zampini   }
1800b68353e5Sstefano_zampini   /* extract CSR for nested SeqAIJ matrices */
1801b68353e5Sstefano_zampini   nnz  = 0;
18025f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscCalloc4(nest->nr*nest->nc,&aii,nest->nr*nest->nc,&ajj,nest->nr*nest->nc,&avv,nest->nr*nest->nc,&trans));
1803b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1804b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1805b68353e5Sstefano_zampini       Mat B = nest->m[i][j];
1806b68353e5Sstefano_zampini       if (B) {
1807b68353e5Sstefano_zampini         PetscScalar *naa;
1808b68353e5Sstefano_zampini         PetscInt    *nii,*njj,nnr;
180923875855Sstefano_zampini         PetscBool   istrans;
1810b68353e5Sstefano_zampini 
18115f80ce2aSJacob Faibussowitsch         CHKERRQ(PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans));
181223875855Sstefano_zampini         if (istrans) {
181323875855Sstefano_zampini           Mat Bt;
181423875855Sstefano_zampini 
18155f80ce2aSJacob Faibussowitsch           CHKERRQ(MatTransposeGetMat(B,&Bt));
18165f80ce2aSJacob Faibussowitsch           CHKERRQ(MatTranspose(Bt,MAT_INITIAL_MATRIX,&trans[i*nest->nc+j]));
181723875855Sstefano_zampini           B    = trans[i*nest->nc+j];
181823875855Sstefano_zampini         }
18195f80ce2aSJacob Faibussowitsch         CHKERRQ(MatGetRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&nii,(const PetscInt**)&njj,&done));
1820*28b400f6SJacob Faibussowitsch         PetscCheck(done,PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatGetRowIJ");
18215f80ce2aSJacob Faibussowitsch         CHKERRQ(MatSeqAIJGetArray(B,&naa));
1822b68353e5Sstefano_zampini         nnz += nii[nnr];
1823b68353e5Sstefano_zampini 
1824b68353e5Sstefano_zampini         aii[i*nest->nc+j] = nii;
1825b68353e5Sstefano_zampini         ajj[i*nest->nc+j] = njj;
1826b68353e5Sstefano_zampini         avv[i*nest->nc+j] = naa;
1827b68353e5Sstefano_zampini       }
1828b68353e5Sstefano_zampini     }
1829b68353e5Sstefano_zampini   }
1830b68353e5Sstefano_zampini   if (reuse != MAT_REUSE_MATRIX) {
18315f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscMalloc1(nr+1,&ii));
18325f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscMalloc1(nnz,&jj));
18335f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscMalloc1(nnz,&vv));
1834b68353e5Sstefano_zampini   } else {
18352c71b3e2SJacob Faibussowitsch     PetscCheckFalse(nnz != ii[nr],PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of nonzeros");
1836b68353e5Sstefano_zampini   }
1837b68353e5Sstefano_zampini 
1838b68353e5Sstefano_zampini   /* new row pointer */
18395f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscArrayzero(ii,nr+1));
1840b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1841b68353e5Sstefano_zampini     PetscInt       ncr,rst;
1842b68353e5Sstefano_zampini 
18435f80ce2aSJacob Faibussowitsch     CHKERRQ(ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL));
18445f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetLocalSize(nest->isglobal.row[i],&ncr));
1845b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1846b68353e5Sstefano_zampini       if (aii[i*nest->nc+j]) {
1847b68353e5Sstefano_zampini         PetscInt    *nii = aii[i*nest->nc+j];
1848b68353e5Sstefano_zampini         PetscInt    ir;
1849b68353e5Sstefano_zampini 
1850b68353e5Sstefano_zampini         for (ir=rst; ir<ncr+rst; ++ir) {
1851b68353e5Sstefano_zampini           ii[ir+1] += nii[1]-nii[0];
1852b68353e5Sstefano_zampini           nii++;
1853b68353e5Sstefano_zampini         }
1854b68353e5Sstefano_zampini       }
1855b68353e5Sstefano_zampini     }
1856b68353e5Sstefano_zampini   }
1857b68353e5Sstefano_zampini   for (i=0; i<nr; i++) ii[i+1] += ii[i];
1858b68353e5Sstefano_zampini 
1859b68353e5Sstefano_zampini   /* construct CSR for the new matrix */
18605f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscCalloc1(nr,&ci));
1861b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1862b68353e5Sstefano_zampini     PetscInt       ncr,rst;
1863b68353e5Sstefano_zampini 
18645f80ce2aSJacob Faibussowitsch     CHKERRQ(ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL));
18655f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetLocalSize(nest->isglobal.row[i],&ncr));
1866b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1867b68353e5Sstefano_zampini       if (aii[i*nest->nc+j]) {
1868b68353e5Sstefano_zampini         PetscScalar *nvv = avv[i*nest->nc+j];
1869b68353e5Sstefano_zampini         PetscInt    *nii = aii[i*nest->nc+j];
1870b68353e5Sstefano_zampini         PetscInt    *njj = ajj[i*nest->nc+j];
1871b68353e5Sstefano_zampini         PetscInt    ir,cst;
1872b68353e5Sstefano_zampini 
18735f80ce2aSJacob Faibussowitsch         CHKERRQ(ISStrideGetInfo(nest->isglobal.col[j],&cst,NULL));
1874b68353e5Sstefano_zampini         for (ir=rst; ir<ncr+rst; ++ir) {
1875b68353e5Sstefano_zampini           PetscInt ij,rsize = nii[1]-nii[0],ist = ii[ir]+ci[ir];
1876b68353e5Sstefano_zampini 
1877b68353e5Sstefano_zampini           for (ij=0;ij<rsize;ij++) {
1878b68353e5Sstefano_zampini             jj[ist+ij] = *njj+cst;
1879b68353e5Sstefano_zampini             vv[ist+ij] = *nvv;
1880b68353e5Sstefano_zampini             njj++;
1881b68353e5Sstefano_zampini             nvv++;
1882b68353e5Sstefano_zampini           }
1883b68353e5Sstefano_zampini           ci[ir] += rsize;
1884b68353e5Sstefano_zampini           nii++;
1885b68353e5Sstefano_zampini         }
1886b68353e5Sstefano_zampini       }
1887b68353e5Sstefano_zampini     }
1888b68353e5Sstefano_zampini   }
18895f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree(ci));
1890b68353e5Sstefano_zampini 
1891b68353e5Sstefano_zampini   /* restore info */
1892b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1893b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1894b68353e5Sstefano_zampini       Mat B = nest->m[i][j];
1895b68353e5Sstefano_zampini       if (B) {
1896b68353e5Sstefano_zampini         PetscInt nnr = 0, k = i*nest->nc+j;
189723875855Sstefano_zampini 
189823875855Sstefano_zampini         B    = (trans[k] ? trans[k] : B);
18995f80ce2aSJacob Faibussowitsch         CHKERRQ(MatRestoreRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&aii[k],(const PetscInt**)&ajj[k],&done));
1900*28b400f6SJacob Faibussowitsch         PetscCheck(done,PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatRestoreRowIJ");
19015f80ce2aSJacob Faibussowitsch         CHKERRQ(MatSeqAIJRestoreArray(B,&avv[k]));
19025f80ce2aSJacob Faibussowitsch         CHKERRQ(MatDestroy(&trans[k]));
1903b68353e5Sstefano_zampini       }
1904b68353e5Sstefano_zampini     }
1905b68353e5Sstefano_zampini   }
19065f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree4(aii,ajj,avv,trans));
1907b68353e5Sstefano_zampini 
1908b68353e5Sstefano_zampini   /* finalize newmat */
1909b68353e5Sstefano_zampini   if (reuse == MAT_INITIAL_MATRIX) {
19105f80ce2aSJacob Faibussowitsch     CHKERRQ(MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,newmat));
1911b68353e5Sstefano_zampini   } else if (reuse == MAT_INPLACE_MATRIX) {
1912b68353e5Sstefano_zampini     Mat B;
1913b68353e5Sstefano_zampini 
19145f80ce2aSJacob Faibussowitsch     CHKERRQ(MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,&B));
19155f80ce2aSJacob Faibussowitsch     CHKERRQ(MatHeaderReplace(A,&B));
1916b68353e5Sstefano_zampini   }
19175f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY));
19185f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY));
1919b68353e5Sstefano_zampini   {
1920b68353e5Sstefano_zampini     Mat_SeqAIJ *a = (Mat_SeqAIJ*)((*newmat)->data);
1921b68353e5Sstefano_zampini     a->free_a     = PETSC_TRUE;
1922b68353e5Sstefano_zampini     a->free_ij    = PETSC_TRUE;
1923b68353e5Sstefano_zampini   }
1924b68353e5Sstefano_zampini   PetscFunctionReturn(0);
1925b68353e5Sstefano_zampini }
1926b68353e5Sstefano_zampini 
1927be705e3aSPierre Jolivet PETSC_INTERN PetscErrorCode MatAXPY_Dense_Nest(Mat Y,PetscScalar a,Mat X)
1928be705e3aSPierre Jolivet {
1929be705e3aSPierre Jolivet   Mat_Nest       *nest = (Mat_Nest*)X->data;
1930be705e3aSPierre Jolivet   PetscInt       i,j,k,rstart;
1931be705e3aSPierre Jolivet   PetscBool      flg;
1932be705e3aSPierre Jolivet 
1933be705e3aSPierre Jolivet   PetscFunctionBegin;
1934be705e3aSPierre Jolivet   /* Fill by row */
1935be705e3aSPierre Jolivet   for (j=0; j<nest->nc; ++j) {
1936be705e3aSPierre Jolivet     /* Using global column indices and ISAllGather() is not scalable. */
1937be705e3aSPierre Jolivet     IS             bNis;
1938be705e3aSPierre Jolivet     PetscInt       bN;
1939be705e3aSPierre Jolivet     const PetscInt *bNindices;
19405f80ce2aSJacob Faibussowitsch     CHKERRQ(ISAllGather(nest->isglobal.col[j], &bNis));
19415f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetSize(bNis,&bN));
19425f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetIndices(bNis,&bNindices));
1943be705e3aSPierre Jolivet     for (i=0; i<nest->nr; ++i) {
1944be705e3aSPierre Jolivet       Mat            B,D=NULL;
1945be705e3aSPierre Jolivet       PetscInt       bm, br;
1946be705e3aSPierre Jolivet       const PetscInt *bmindices;
1947be705e3aSPierre Jolivet       B = nest->m[i][j];
1948be705e3aSPierre Jolivet       if (!B) continue;
19495f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&flg));
1950be705e3aSPierre Jolivet       if (flg) {
19515f80ce2aSJacob Faibussowitsch         CHKERRQ(PetscTryMethod(B,"MatTransposeGetMat_C",(Mat,Mat*),(B,&D)));
19525f80ce2aSJacob Faibussowitsch         CHKERRQ(PetscTryMethod(B,"MatHermitianTransposeGetMat_C",(Mat,Mat*),(B,&D)));
19535f80ce2aSJacob Faibussowitsch         CHKERRQ(MatConvert(B,((PetscObject)D)->type_name,MAT_INITIAL_MATRIX,&D));
1954be705e3aSPierre Jolivet         B = D;
1955be705e3aSPierre Jolivet       }
19565f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQSBAIJ,MATMPISBAIJ,""));
1957be705e3aSPierre Jolivet       if (flg) {
1958be705e3aSPierre Jolivet         if (D) {
19595f80ce2aSJacob Faibussowitsch           CHKERRQ(MatConvert(D,MATBAIJ,MAT_INPLACE_MATRIX,&D));
1960be705e3aSPierre Jolivet         } else {
19615f80ce2aSJacob Faibussowitsch           CHKERRQ(MatConvert(B,MATBAIJ,MAT_INITIAL_MATRIX,&D));
1962be705e3aSPierre Jolivet         }
1963be705e3aSPierre Jolivet         B = D;
1964be705e3aSPierre Jolivet       }
19655f80ce2aSJacob Faibussowitsch       CHKERRQ(ISGetLocalSize(nest->isglobal.row[i],&bm));
19665f80ce2aSJacob Faibussowitsch       CHKERRQ(ISGetIndices(nest->isglobal.row[i],&bmindices));
19675f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetOwnershipRange(B,&rstart,NULL));
1968be705e3aSPierre Jolivet       for (br = 0; br < bm; ++br) {
1969be705e3aSPierre Jolivet         PetscInt          row = bmindices[br], brncols, *cols;
1970be705e3aSPierre Jolivet         const PetscInt    *brcols;
1971be705e3aSPierre Jolivet         const PetscScalar *brcoldata;
1972be705e3aSPierre Jolivet         PetscScalar       *vals = NULL;
19735f80ce2aSJacob Faibussowitsch         CHKERRQ(MatGetRow(B,br+rstart,&brncols,&brcols,&brcoldata));
19745f80ce2aSJacob Faibussowitsch         CHKERRQ(PetscMalloc1(brncols,&cols));
1975be705e3aSPierre Jolivet         for (k=0; k<brncols; k++) cols[k] = bNindices[brcols[k]];
1976be705e3aSPierre Jolivet         /*
1977be705e3aSPierre Jolivet           Nest blocks are required to be nonoverlapping -- otherwise nest and monolithic index layouts wouldn't match.
1978be705e3aSPierre Jolivet           Thus, we could use INSERT_VALUES, but I prefer ADD_VALUES.
1979be705e3aSPierre Jolivet          */
1980be705e3aSPierre Jolivet         if (a != 1.0) {
19815f80ce2aSJacob Faibussowitsch           CHKERRQ(PetscMalloc1(brncols,&vals));
1982be705e3aSPierre Jolivet           for (k=0; k<brncols; k++) vals[k] = a * brcoldata[k];
19835f80ce2aSJacob Faibussowitsch           CHKERRQ(MatSetValues(Y,1,&row,brncols,cols,vals,ADD_VALUES));
19845f80ce2aSJacob Faibussowitsch           CHKERRQ(PetscFree(vals));
1985be705e3aSPierre Jolivet         } else {
19865f80ce2aSJacob Faibussowitsch           CHKERRQ(MatSetValues(Y,1,&row,brncols,cols,brcoldata,ADD_VALUES));
1987be705e3aSPierre Jolivet         }
19885f80ce2aSJacob Faibussowitsch         CHKERRQ(MatRestoreRow(B,br+rstart,&brncols,&brcols,&brcoldata));
19895f80ce2aSJacob Faibussowitsch         CHKERRQ(PetscFree(cols));
1990be705e3aSPierre Jolivet       }
1991be705e3aSPierre Jolivet       if (D) {
19925f80ce2aSJacob Faibussowitsch         CHKERRQ(MatDestroy(&D));
1993be705e3aSPierre Jolivet       }
19945f80ce2aSJacob Faibussowitsch       CHKERRQ(ISRestoreIndices(nest->isglobal.row[i],&bmindices));
1995be705e3aSPierre Jolivet     }
19965f80ce2aSJacob Faibussowitsch     CHKERRQ(ISRestoreIndices(bNis,&bNindices));
19975f80ce2aSJacob Faibussowitsch     CHKERRQ(ISDestroy(&bNis));
1998be705e3aSPierre Jolivet   }
19995f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyBegin(Y,MAT_FINAL_ASSEMBLY));
20005f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyEnd(Y,MAT_FINAL_ASSEMBLY));
2001be705e3aSPierre Jolivet   PetscFunctionReturn(0);
2002be705e3aSPierre Jolivet }
2003be705e3aSPierre Jolivet 
2004be705e3aSPierre Jolivet PetscErrorCode MatConvert_Nest_AIJ(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
2005629c3df2SDmitry Karpeev {
2006629c3df2SDmitry Karpeev   Mat_Nest       *nest = (Mat_Nest*)A->data;
2007be705e3aSPierre Jolivet   PetscInt       m,n,M,N,i,j,k,*dnnz,*onnz,rstart,cstart,cend;
2008b68353e5Sstefano_zampini   PetscMPIInt    size;
2009629c3df2SDmitry Karpeev   Mat            C;
2010629c3df2SDmitry Karpeev 
2011629c3df2SDmitry Karpeev   PetscFunctionBegin;
20125f80ce2aSJacob Faibussowitsch   CHKERRMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A),&size));
2013b68353e5Sstefano_zampini   if (size == 1) { /* look for a special case with SeqAIJ matrices and strided-1, contiguous, blocks */
2014b68353e5Sstefano_zampini     PetscInt  nf;
2015b68353e5Sstefano_zampini     PetscBool fast;
2016b68353e5Sstefano_zampini 
20175f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscStrcmp(newtype,MATAIJ,&fast));
2018b68353e5Sstefano_zampini     if (!fast) {
20195f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscStrcmp(newtype,MATSEQAIJ,&fast));
2020b68353e5Sstefano_zampini     }
2021b68353e5Sstefano_zampini     for (i=0; i<nest->nr && fast; ++i) {
2022b68353e5Sstefano_zampini       for (j=0; j<nest->nc && fast; ++j) {
2023b68353e5Sstefano_zampini         Mat B = nest->m[i][j];
2024b68353e5Sstefano_zampini         if (B) {
20255f80ce2aSJacob Faibussowitsch           CHKERRQ(PetscObjectTypeCompare((PetscObject)B,MATSEQAIJ,&fast));
202623875855Sstefano_zampini           if (!fast) {
202723875855Sstefano_zampini             PetscBool istrans;
202823875855Sstefano_zampini 
20295f80ce2aSJacob Faibussowitsch             CHKERRQ(PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans));
203023875855Sstefano_zampini             if (istrans) {
203123875855Sstefano_zampini               Mat Bt;
203223875855Sstefano_zampini 
20335f80ce2aSJacob Faibussowitsch               CHKERRQ(MatTransposeGetMat(B,&Bt));
20345f80ce2aSJacob Faibussowitsch               CHKERRQ(PetscObjectTypeCompare((PetscObject)Bt,MATSEQAIJ,&fast));
203523875855Sstefano_zampini             }
2036b68353e5Sstefano_zampini           }
2037b68353e5Sstefano_zampini         }
2038b68353e5Sstefano_zampini       }
2039b68353e5Sstefano_zampini     }
2040b68353e5Sstefano_zampini     for (i=0, nf=0; i<nest->nr && fast; ++i) {
20415f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscObjectTypeCompare((PetscObject)nest->isglobal.row[i],ISSTRIDE,&fast));
2042b68353e5Sstefano_zampini       if (fast) {
2043b68353e5Sstefano_zampini         PetscInt f,s;
2044b68353e5Sstefano_zampini 
20455f80ce2aSJacob Faibussowitsch         CHKERRQ(ISStrideGetInfo(nest->isglobal.row[i],&f,&s));
2046b68353e5Sstefano_zampini         if (f != nf || s != 1) { fast = PETSC_FALSE; }
2047b68353e5Sstefano_zampini         else {
20485f80ce2aSJacob Faibussowitsch           CHKERRQ(ISGetSize(nest->isglobal.row[i],&f));
2049b68353e5Sstefano_zampini           nf  += f;
2050b68353e5Sstefano_zampini         }
2051b68353e5Sstefano_zampini       }
2052b68353e5Sstefano_zampini     }
2053b68353e5Sstefano_zampini     for (i=0, nf=0; i<nest->nc && fast; ++i) {
20545f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscObjectTypeCompare((PetscObject)nest->isglobal.col[i],ISSTRIDE,&fast));
2055b68353e5Sstefano_zampini       if (fast) {
2056b68353e5Sstefano_zampini         PetscInt f,s;
2057b68353e5Sstefano_zampini 
20585f80ce2aSJacob Faibussowitsch         CHKERRQ(ISStrideGetInfo(nest->isglobal.col[i],&f,&s));
2059b68353e5Sstefano_zampini         if (f != nf || s != 1) { fast = PETSC_FALSE; }
2060b68353e5Sstefano_zampini         else {
20615f80ce2aSJacob Faibussowitsch           CHKERRQ(ISGetSize(nest->isglobal.col[i],&f));
2062b68353e5Sstefano_zampini           nf  += f;
2063b68353e5Sstefano_zampini         }
2064b68353e5Sstefano_zampini       }
2065b68353e5Sstefano_zampini     }
2066b68353e5Sstefano_zampini     if (fast) {
20675f80ce2aSJacob Faibussowitsch       CHKERRQ(MatConvert_Nest_SeqAIJ_fast(A,newtype,reuse,newmat));
2068b68353e5Sstefano_zampini       PetscFunctionReturn(0);
2069b68353e5Sstefano_zampini     }
2070b68353e5Sstefano_zampini   }
20715f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetSize(A,&M,&N));
20725f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetLocalSize(A,&m,&n));
20735f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetOwnershipRangeColumn(A,&cstart,&cend));
2074d1487292SPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) C = *newmat;
2075d1487292SPierre Jolivet   else {
20765f80ce2aSJacob Faibussowitsch     CHKERRQ(MatCreate(PetscObjectComm((PetscObject)A),&C));
20775f80ce2aSJacob Faibussowitsch     CHKERRQ(MatSetType(C,newtype));
20785f80ce2aSJacob Faibussowitsch     CHKERRQ(MatSetSizes(C,m,n,M,N));
2079629c3df2SDmitry Karpeev   }
20805f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMalloc1(2*m,&dnnz));
2081629c3df2SDmitry Karpeev   onnz = dnnz + m;
2082629c3df2SDmitry Karpeev   for (k=0; k<m; k++) {
2083629c3df2SDmitry Karpeev     dnnz[k] = 0;
2084629c3df2SDmitry Karpeev     onnz[k] = 0;
2085629c3df2SDmitry Karpeev   }
2086629c3df2SDmitry Karpeev   for (j=0; j<nest->nc; ++j) {
2087629c3df2SDmitry Karpeev     IS             bNis;
2088629c3df2SDmitry Karpeev     PetscInt       bN;
2089629c3df2SDmitry Karpeev     const PetscInt *bNindices;
2090629c3df2SDmitry Karpeev     /* Using global column indices and ISAllGather() is not scalable. */
20915f80ce2aSJacob Faibussowitsch     CHKERRQ(ISAllGather(nest->isglobal.col[j], &bNis));
20925f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetSize(bNis, &bN));
20935f80ce2aSJacob Faibussowitsch     CHKERRQ(ISGetIndices(bNis,&bNindices));
2094629c3df2SDmitry Karpeev     for (i=0; i<nest->nr; ++i) {
2095629c3df2SDmitry Karpeev       PetscSF        bmsf;
2096649b366bSFande Kong       PetscSFNode    *iremote;
2097629c3df2SDmitry Karpeev       Mat            B;
2098649b366bSFande Kong       PetscInt       bm, *sub_dnnz,*sub_onnz, br;
2099629c3df2SDmitry Karpeev       const PetscInt *bmindices;
2100629c3df2SDmitry Karpeev       B = nest->m[i][j];
2101629c3df2SDmitry Karpeev       if (!B) continue;
21025f80ce2aSJacob Faibussowitsch       CHKERRQ(ISGetLocalSize(nest->isglobal.row[i],&bm));
21035f80ce2aSJacob Faibussowitsch       CHKERRQ(ISGetIndices(nest->isglobal.row[i],&bmindices));
21045f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscSFCreate(PetscObjectComm((PetscObject)A), &bmsf));
21055f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscMalloc1(bm,&iremote));
21065f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscMalloc1(bm,&sub_dnnz));
21075f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscMalloc1(bm,&sub_onnz));
2108649b366bSFande Kong       for (k = 0; k < bm; ++k) {
2109649b366bSFande Kong         sub_dnnz[k] = 0;
2110649b366bSFande Kong         sub_onnz[k] = 0;
2111649b366bSFande Kong       }
2112629c3df2SDmitry Karpeev       /*
2113629c3df2SDmitry Karpeev        Locate the owners for all of the locally-owned global row indices for this row block.
2114629c3df2SDmitry Karpeev        These determine the roots of PetscSF used to communicate preallocation data to row owners.
2115629c3df2SDmitry Karpeev        The roots correspond to the dnnz and onnz entries; thus, there are two roots per row.
2116629c3df2SDmitry Karpeev        */
21175f80ce2aSJacob Faibussowitsch       CHKERRQ(MatGetOwnershipRange(B,&rstart,NULL));
2118629c3df2SDmitry Karpeev       for (br = 0; br < bm; ++br) {
2119131c27b5Sprj-         PetscInt       row = bmindices[br], brncols, col;
2120629c3df2SDmitry Karpeev         const PetscInt *brcols;
2121a4b3d3acSMatthew G Knepley         PetscInt       rowrel = 0; /* row's relative index on its owner rank */
2122131c27b5Sprj-         PetscMPIInt    rowowner = 0;
21235f80ce2aSJacob Faibussowitsch         CHKERRQ(PetscLayoutFindOwnerIndex(A->rmap,row,&rowowner,&rowrel));
2124649b366bSFande Kong         /* how many roots  */
2125649b366bSFande Kong         iremote[br].rank = rowowner; iremote[br].index = rowrel;           /* edge from bmdnnz to dnnz */
2126649b366bSFande Kong         /* get nonzero pattern */
21275f80ce2aSJacob Faibussowitsch         CHKERRQ(MatGetRow(B,br+rstart,&brncols,&brcols,NULL));
2128629c3df2SDmitry Karpeev         for (k=0; k<brncols; k++) {
2129629c3df2SDmitry Karpeev           col  = bNindices[brcols[k]];
2130649b366bSFande Kong           if (col>=A->cmap->range[rowowner] && col<A->cmap->range[rowowner+1]) {
2131649b366bSFande Kong             sub_dnnz[br]++;
2132649b366bSFande Kong           } else {
2133649b366bSFande Kong             sub_onnz[br]++;
2134649b366bSFande Kong           }
2135629c3df2SDmitry Karpeev         }
21365f80ce2aSJacob Faibussowitsch         CHKERRQ(MatRestoreRow(B,br+rstart,&brncols,&brcols,NULL));
2137629c3df2SDmitry Karpeev       }
21385f80ce2aSJacob Faibussowitsch       CHKERRQ(ISRestoreIndices(nest->isglobal.row[i],&bmindices));
2139629c3df2SDmitry Karpeev       /* bsf will have to take care of disposing of bedges. */
21405f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscSFSetGraph(bmsf,m,bm,NULL,PETSC_OWN_POINTER,iremote,PETSC_OWN_POINTER));
21415f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscSFReduceBegin(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM));
21425f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscSFReduceEnd(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM));
21435f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscSFReduceBegin(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM));
21445f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscSFReduceEnd(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM));
21455f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscFree(sub_dnnz));
21465f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscFree(sub_onnz));
21475f80ce2aSJacob Faibussowitsch       CHKERRQ(PetscSFDestroy(&bmsf));
2148629c3df2SDmitry Karpeev     }
21495f80ce2aSJacob Faibussowitsch     CHKERRQ(ISRestoreIndices(bNis,&bNindices));
21505f80ce2aSJacob Faibussowitsch     CHKERRQ(ISDestroy(&bNis));
215165a4a0a3Sstefano_zampini   }
215265a4a0a3Sstefano_zampini   /* Resize preallocation if overestimated */
215365a4a0a3Sstefano_zampini   for (i=0;i<m;i++) {
215465a4a0a3Sstefano_zampini     dnnz[i] = PetscMin(dnnz[i],A->cmap->n);
215565a4a0a3Sstefano_zampini     onnz[i] = PetscMin(onnz[i],A->cmap->N - A->cmap->n);
2156629c3df2SDmitry Karpeev   }
21575f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSeqAIJSetPreallocation(C,0,dnnz));
21585f80ce2aSJacob Faibussowitsch   CHKERRQ(MatMPIAIJSetPreallocation(C,0,dnnz,0,onnz));
21595f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscFree(dnnz));
21605f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAXPY_Dense_Nest(C,1.0,A));
2161d1487292SPierre Jolivet   if (reuse == MAT_INPLACE_MATRIX) {
21625f80ce2aSJacob Faibussowitsch     CHKERRQ(MatHeaderReplace(A,&C));
2163d1487292SPierre Jolivet   } else *newmat = C;
2164be705e3aSPierre Jolivet   PetscFunctionReturn(0);
2165be705e3aSPierre Jolivet }
2166629c3df2SDmitry Karpeev 
2167be705e3aSPierre Jolivet PetscErrorCode MatConvert_Nest_Dense(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
2168be705e3aSPierre Jolivet {
2169629c3df2SDmitry Karpeev   Mat            B;
2170be705e3aSPierre Jolivet   PetscInt       m,n,M,N;
2171be705e3aSPierre Jolivet 
2172be705e3aSPierre Jolivet   PetscFunctionBegin;
21735f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetSize(A,&M,&N));
21745f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetLocalSize(A,&m,&n));
2175be705e3aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
2176be705e3aSPierre Jolivet     B = *newmat;
21775f80ce2aSJacob Faibussowitsch     CHKERRQ(MatZeroEntries(B));
2178be705e3aSPierre Jolivet   } else {
21795f80ce2aSJacob Faibussowitsch     CHKERRQ(MatCreateDense(PetscObjectComm((PetscObject)A),m,PETSC_DECIDE,M,N,NULL,&B));
2180629c3df2SDmitry Karpeev   }
21815f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAXPY_Dense_Nest(B,1.0,A));
2182be705e3aSPierre Jolivet   if (reuse == MAT_INPLACE_MATRIX) {
21835f80ce2aSJacob Faibussowitsch     CHKERRQ(MatHeaderReplace(A,&B));
2184be705e3aSPierre Jolivet   } else if (reuse == MAT_INITIAL_MATRIX) *newmat = B;
2185629c3df2SDmitry Karpeev   PetscFunctionReturn(0);
2186629c3df2SDmitry Karpeev }
2187629c3df2SDmitry Karpeev 
21888b7d3b4bSBarry Smith PetscErrorCode MatHasOperation_Nest(Mat mat,MatOperation op,PetscBool *has)
21898b7d3b4bSBarry Smith {
21908b7d3b4bSBarry Smith   Mat_Nest       *bA = (Mat_Nest*)mat->data;
21913c6db4c4SPierre Jolivet   MatOperation   opAdd;
21928b7d3b4bSBarry Smith   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
21938b7d3b4bSBarry Smith   PetscBool      flg;
219452c5f739Sprj-   PetscFunctionBegin;
21958b7d3b4bSBarry Smith 
219652c5f739Sprj-   *has = PETSC_FALSE;
21973c6db4c4SPierre Jolivet   if (op == MATOP_MULT || op == MATOP_MULT_ADD || op == MATOP_MULT_TRANSPOSE || op == MATOP_MULT_TRANSPOSE_ADD) {
21983c6db4c4SPierre Jolivet     opAdd = (op == MATOP_MULT || op == MATOP_MULT_ADD ? MATOP_MULT_ADD : MATOP_MULT_TRANSPOSE_ADD);
21998b7d3b4bSBarry Smith     for (j=0; j<nc; j++) {
22008b7d3b4bSBarry Smith       for (i=0; i<nr; i++) {
22018b7d3b4bSBarry Smith         if (!bA->m[i][j]) continue;
22025f80ce2aSJacob Faibussowitsch         CHKERRQ(MatHasOperation(bA->m[i][j],opAdd,&flg));
22038b7d3b4bSBarry Smith         if (!flg) PetscFunctionReturn(0);
22048b7d3b4bSBarry Smith       }
22058b7d3b4bSBarry Smith     }
22068b7d3b4bSBarry Smith   }
22073c6db4c4SPierre Jolivet   if (((void**)mat->ops)[op]) *has = PETSC_TRUE;
22088b7d3b4bSBarry Smith   PetscFunctionReturn(0);
22098b7d3b4bSBarry Smith }
22108b7d3b4bSBarry Smith 
/*MC
  MATNEST - MATNEST = "nest" - Matrix type consisting of nested submatrices, each stored separately.

  Level: intermediate

  Notes:
  This matrix type permits scalable use of PCFieldSplit and avoids the large memory costs of extracting submatrices.
  It allows the use of symmetric and block formats for parts of multi-physics simulations.
  It is usually used with DMComposite and DMCreateMatrix().

  Each of the submatrices lives on the same MPI communicator as the original nest matrix (though they can have zero
  rows/columns on some processes). Thus this is not meant for cases where the submatrices live on far fewer processes
  than the nest matrix.

.seealso: MatCreate(), MatType, MatCreateNest(), MatNestSetSubMat(), MatNestGetSubMat(),
          VecCreateNest(), DMCreateMatrix(), DMCOMPOSITE, MatNestSetVecType(), MatNestGetLocalISs(),
          MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats()
M*/
22298cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_Nest(Mat A)
2230c8883902SJed Brown {
2231c8883902SJed Brown   Mat_Nest       *s;
2232c8883902SJed Brown 
2233c8883902SJed Brown   PetscFunctionBegin;
22345f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscNewLog(A,&s));
2235c8883902SJed Brown   A->data = (void*)s;
2236e7c19651SJed Brown 
2237e7c19651SJed Brown   s->nr            = -1;
2238e7c19651SJed Brown   s->nc            = -1;
22390298fd71SBarry Smith   s->m             = NULL;
2240e7c19651SJed Brown   s->splitassembly = PETSC_FALSE;
2241c8883902SJed Brown 
22425f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscMemzero(A->ops,sizeof(*A->ops)));
224326fbe8dcSKarl Rupp 
2244c8883902SJed Brown   A->ops->mult                  = MatMult_Nest;
22459194d70fSJed Brown   A->ops->multadd               = MatMultAdd_Nest;
2246c8883902SJed Brown   A->ops->multtranspose         = MatMultTranspose_Nest;
22479194d70fSJed Brown   A->ops->multtransposeadd      = MatMultTransposeAdd_Nest;
2248f8170845SAlex Fikl   A->ops->transpose             = MatTranspose_Nest;
2249c8883902SJed Brown   A->ops->assemblybegin         = MatAssemblyBegin_Nest;
2250c8883902SJed Brown   A->ops->assemblyend           = MatAssemblyEnd_Nest;
2251c8883902SJed Brown   A->ops->zeroentries           = MatZeroEntries_Nest;
2252c222c20dSDavid Ham   A->ops->copy                  = MatCopy_Nest;
22536e76ffeaSPierre Jolivet   A->ops->axpy                  = MatAXPY_Nest;
2254c8883902SJed Brown   A->ops->duplicate             = MatDuplicate_Nest;
22557dae84e0SHong Zhang   A->ops->createsubmatrix       = MatCreateSubMatrix_Nest;
2256c8883902SJed Brown   A->ops->destroy               = MatDestroy_Nest;
2257c8883902SJed Brown   A->ops->view                  = MatView_Nest;
2258f4259b30SLisandro Dalcin   A->ops->getvecs               = NULL; /* Use VECNEST by calling MatNestSetVecType(A,VECNEST) */
2259c8883902SJed Brown   A->ops->getlocalsubmatrix     = MatGetLocalSubMatrix_Nest;
2260c8883902SJed Brown   A->ops->restorelocalsubmatrix = MatRestoreLocalSubMatrix_Nest;
2261429bac76SJed Brown   A->ops->getdiagonal           = MatGetDiagonal_Nest;
2262429bac76SJed Brown   A->ops->diagonalscale         = MatDiagonalScale_Nest;
2263a061e289SJed Brown   A->ops->scale                 = MatScale_Nest;
2264a061e289SJed Brown   A->ops->shift                 = MatShift_Nest;
226513135bc6SAlex Fikl   A->ops->diagonalset           = MatDiagonalSet_Nest;
2266f8170845SAlex Fikl   A->ops->setrandom             = MatSetRandom_Nest;
22678b7d3b4bSBarry Smith   A->ops->hasoperation          = MatHasOperation_Nest;
2268381b8e50SStefano Zampini   A->ops->missingdiagonal       = MatMissingDiagonal_Nest;
2269c8883902SJed Brown 
2270f4259b30SLisandro Dalcin   A->spptr        = NULL;
2271c8883902SJed Brown   A->assembled    = PETSC_FALSE;
2272c8883902SJed Brown 
2273c8883902SJed Brown   /* expose Nest api's */
22745f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",        MatNestGetSubMat_Nest));
22755f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",        MatNestSetSubMat_Nest));
22765f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",       MatNestGetSubMats_Nest));
22775f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",          MatNestGetSize_Nest));
22785f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",           MatNestGetISs_Nest));
22795f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",      MatNestGetLocalISs_Nest));
22805f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",       MatNestSetVecType_Nest));
22815f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",       MatNestSetSubMats_Nest));
22825f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",  MatConvert_Nest_AIJ));
22835f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",  MatConvert_Nest_AIJ));
22845f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",     MatConvert_Nest_AIJ));
22855f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",      MatConvert_Nest_IS));
22865f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpidense_C",MatConvert_Nest_Dense));
22875f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqdense_C",MatConvert_Nest_Dense));
22885f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_seqdense_C",MatProductSetFromOptions_Nest_Dense));
22895f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_mpidense_C",MatProductSetFromOptions_Nest_Dense));
22905f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_dense_C",MatProductSetFromOptions_Nest_Dense));
2291c8883902SJed Brown 
22925f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectChangeTypeName((PetscObject)A,MATNEST));
2293c8883902SJed Brown   PetscFunctionReturn(0);
2294c8883902SJed Brown }
2295