xref: /petsc/src/mat/impls/nest/matnest.c (revision f4259b3095b7e7c300c2b3c3729548b071684bd7)
1aaa7dc30SBarry Smith #include <../src/mat/impls/nest/matnestimpl.h> /*I   "petscmat.h"   I*/
2b68353e5Sstefano_zampini #include <../src/mat/impls/aij/seq/aij.h>
30c312b8eSJed Brown #include <petscsf.h>
4d8588912SDave May 
5c8883902SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat,PetscInt,const IS[],PetscInt,const IS[]);
606a1af2fSStefano Zampini static PetscErrorCode MatCreateVecs_Nest(Mat,Vec*,Vec*);
706a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat);
806a1af2fSStefano Zampini 
95e3038f0Sstefano_zampini PETSC_INTERN PetscErrorCode MatConvert_Nest_IS(Mat,MatType,MatReuse,Mat*);
10c8883902SJed Brown 
11d8588912SDave May /* private functions */
128188e55aSJed Brown static PetscErrorCode MatNestGetSizes_Private(Mat A,PetscInt *m,PetscInt *n,PetscInt *M,PetscInt *N)
13d8588912SDave May {
14d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
158188e55aSJed Brown   PetscInt       i,j;
16d8588912SDave May   PetscErrorCode ierr;
17d8588912SDave May 
18d8588912SDave May   PetscFunctionBegin;
198188e55aSJed Brown   *m = *n = *M = *N = 0;
208188e55aSJed Brown   for (i=0; i<bA->nr; i++) {  /* rows */
218188e55aSJed Brown     PetscInt sm,sM;
228188e55aSJed Brown     ierr = ISGetLocalSize(bA->isglobal.row[i],&sm);CHKERRQ(ierr);
238188e55aSJed Brown     ierr = ISGetSize(bA->isglobal.row[i],&sM);CHKERRQ(ierr);
248188e55aSJed Brown     *m  += sm;
258188e55aSJed Brown     *M  += sM;
26d8588912SDave May   }
278188e55aSJed Brown   for (j=0; j<bA->nc; j++) {  /* cols */
288188e55aSJed Brown     PetscInt sn,sN;
298188e55aSJed Brown     ierr = ISGetLocalSize(bA->isglobal.col[j],&sn);CHKERRQ(ierr);
308188e55aSJed Brown     ierr = ISGetSize(bA->isglobal.col[j],&sN);CHKERRQ(ierr);
318188e55aSJed Brown     *n  += sn;
328188e55aSJed Brown     *N  += sN;
33d8588912SDave May   }
34d8588912SDave May   PetscFunctionReturn(0);
35d8588912SDave May }
36d8588912SDave May 
37d8588912SDave May /* operations */
38207556f9SJed Brown static PetscErrorCode MatMult_Nest(Mat A,Vec x,Vec y)
39d8588912SDave May {
40d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
41207556f9SJed Brown   Vec            *bx = bA->right,*by = bA->left;
42207556f9SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
43d8588912SDave May   PetscErrorCode ierr;
44d8588912SDave May 
45d8588912SDave May   PetscFunctionBegin;
46207556f9SJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(y,bA->isglobal.row[i],&by[i]);CHKERRQ(ierr);}
47207556f9SJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
48207556f9SJed Brown   for (i=0; i<nr; i++) {
49d8588912SDave May     ierr = VecZeroEntries(by[i]);CHKERRQ(ierr);
50207556f9SJed Brown     for (j=0; j<nc; j++) {
51207556f9SJed Brown       if (!bA->m[i][j]) continue;
52d8588912SDave May       /* y[i] <- y[i] + A[i][j] * x[j] */
53d8588912SDave May       ierr = MatMultAdd(bA->m[i][j],bx[j],by[i],by[i]);CHKERRQ(ierr);
54d8588912SDave May     }
55d8588912SDave May   }
56207556f9SJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(y,bA->isglobal.row[i],&by[i]);CHKERRQ(ierr);}
57207556f9SJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
58d8588912SDave May   PetscFunctionReturn(0);
59d8588912SDave May }
60d8588912SDave May 
619194d70fSJed Brown static PetscErrorCode MatMultAdd_Nest(Mat A,Vec x,Vec y,Vec z)
629194d70fSJed Brown {
639194d70fSJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
649194d70fSJed Brown   Vec            *bx = bA->right,*bz = bA->left;
659194d70fSJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
669194d70fSJed Brown   PetscErrorCode ierr;
679194d70fSJed Brown 
689194d70fSJed Brown   PetscFunctionBegin;
699194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(z,bA->isglobal.row[i],&bz[i]);CHKERRQ(ierr);}
709194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
719194d70fSJed Brown   for (i=0; i<nr; i++) {
729194d70fSJed Brown     if (y != z) {
739194d70fSJed Brown       Vec by;
749194d70fSJed Brown       ierr = VecGetSubVector(y,bA->isglobal.row[i],&by);CHKERRQ(ierr);
759194d70fSJed Brown       ierr = VecCopy(by,bz[i]);CHKERRQ(ierr);
76336d21e7SJed Brown       ierr = VecRestoreSubVector(y,bA->isglobal.row[i],&by);CHKERRQ(ierr);
779194d70fSJed Brown     }
789194d70fSJed Brown     for (j=0; j<nc; j++) {
799194d70fSJed Brown       if (!bA->m[i][j]) continue;
809194d70fSJed Brown       /* y[i] <- y[i] + A[i][j] * x[j] */
819194d70fSJed Brown       ierr = MatMultAdd(bA->m[i][j],bx[j],bz[i],bz[i]);CHKERRQ(ierr);
829194d70fSJed Brown     }
839194d70fSJed Brown   }
849194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(z,bA->isglobal.row[i],&bz[i]);CHKERRQ(ierr);}
859194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
869194d70fSJed Brown   PetscFunctionReturn(0);
879194d70fSJed Brown }
889194d70fSJed Brown 
8952c5f739Sprj- typedef struct {
9052c5f739Sprj-   Mat          *workC;    /* array of Mat with specific containers depending on the underlying MatMatMult implementation */
9152c5f739Sprj-   PetscScalar  *tarray;   /* buffer for storing all temporary products A[i][j] B[j] */
9252c5f739Sprj-   PetscInt     *dm,*dn,k; /* displacements and number of submatrices */
9352c5f739Sprj- } Nest_Dense;
9452c5f739Sprj- 
956718818eSStefano Zampini PETSC_INTERN PetscErrorCode MatProductNumeric_Nest_Dense(Mat C)
9652c5f739Sprj- {
976718818eSStefano Zampini   Mat_Nest          *bA;
9852c5f739Sprj-   Nest_Dense        *contents;
996718818eSStefano Zampini   Mat               viewB,viewC,productB,workC;
10052c5f739Sprj-   const PetscScalar *barray;
10152c5f739Sprj-   PetscScalar       *carray;
1026718818eSStefano Zampini   PetscInt          i,j,M,N,nr,nc,ldb,ldc;
10352c5f739Sprj-   PetscErrorCode    ierr;
1046718818eSStefano Zampini   Mat               A,B;
10552c5f739Sprj- 
10652c5f739Sprj-   PetscFunctionBegin;
1076718818eSStefano Zampini   MatCheckProduct(C,3);
1086718818eSStefano Zampini   A    = C->product->A;
1096718818eSStefano Zampini   B    = C->product->B;
1106718818eSStefano Zampini   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
1116718818eSStefano Zampini   if (!N) {
1126718818eSStefano Zampini     ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1136718818eSStefano Zampini     ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1146718818eSStefano Zampini     PetscFunctionReturn(0);
1156718818eSStefano Zampini   }
1166718818eSStefano Zampini   contents = (Nest_Dense*)C->product->data;
1176718818eSStefano Zampini   if (!contents) SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Product data empty");
1186718818eSStefano Zampini   bA   = (Mat_Nest*)A->data;
1196718818eSStefano Zampini   nr   = bA->nr;
1206718818eSStefano Zampini   nc   = bA->nc;
12152c5f739Sprj-   ierr = MatDenseGetLDA(B,&ldb);CHKERRQ(ierr);
12252c5f739Sprj-   ierr = MatDenseGetLDA(C,&ldc);CHKERRQ(ierr);
12352c5f739Sprj-   ierr = MatZeroEntries(C);CHKERRQ(ierr);
12452c5f739Sprj-   ierr = MatDenseGetArrayRead(B,&barray);CHKERRQ(ierr);
1256718818eSStefano Zampini   ierr = MatDenseGetArrayWrite(C,&carray);CHKERRQ(ierr);
12652c5f739Sprj-   for (i=0; i<nr; i++) {
12752c5f739Sprj-     ierr = ISGetSize(bA->isglobal.row[i],&M);CHKERRQ(ierr);
12852c5f739Sprj-     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dm[i+1]-contents->dm[i],PETSC_DECIDE,M,N,carray+contents->dm[i],&viewC);CHKERRQ(ierr);
1296718818eSStefano Zampini     ierr = MatDenseSetLDA(viewC,ldc);CHKERRQ(ierr);
13052c5f739Sprj-     for (j=0; j<nc; j++) {
13152c5f739Sprj-       if (!bA->m[i][j]) continue;
13252c5f739Sprj-       ierr = ISGetSize(bA->isglobal.col[j],&M);CHKERRQ(ierr);
13352c5f739Sprj-       ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB);CHKERRQ(ierr);
1346718818eSStefano Zampini       ierr = MatDenseSetLDA(viewB,ldb);CHKERRQ(ierr);
1354222ddf1SHong Zhang 
1364222ddf1SHong Zhang       /* MatMatMultNumeric(bA->m[i][j],viewB,contents->workC[i*nc + j]); */
1374222ddf1SHong Zhang       workC             = contents->workC[i*nc + j];
1384222ddf1SHong Zhang       productB          = workC->product->B;
1394222ddf1SHong Zhang       workC->product->B = viewB; /* use newly created dense matrix viewB */
1406718818eSStefano Zampini       ierr = MatProductNumeric(workC);CHKERRQ(ierr);
14152c5f739Sprj-       ierr = MatDestroy(&viewB);CHKERRQ(ierr);
1424222ddf1SHong Zhang       workC->product->B = productB; /* resume original B */
1434222ddf1SHong Zhang 
14452c5f739Sprj-       /* C[i] <- workC + C[i] */
14552c5f739Sprj-       ierr = MatAXPY(viewC,1.0,contents->workC[i*nc + j],SAME_NONZERO_PATTERN);CHKERRQ(ierr);
14652c5f739Sprj-     }
14752c5f739Sprj-     ierr = MatDestroy(&viewC);CHKERRQ(ierr);
14852c5f739Sprj-   }
1496718818eSStefano Zampini   ierr = MatDenseRestoreArrayWrite(C,&carray);CHKERRQ(ierr);
15052c5f739Sprj-   ierr = MatDenseRestoreArrayRead(B,&barray);CHKERRQ(ierr);
1514222ddf1SHong Zhang 
1524222ddf1SHong Zhang   ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1534222ddf1SHong Zhang   ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15452c5f739Sprj-   PetscFunctionReturn(0);
15552c5f739Sprj- }
15652c5f739Sprj- 
15752c5f739Sprj- PetscErrorCode MatNest_DenseDestroy(void *ctx)
15852c5f739Sprj- {
15952c5f739Sprj-   Nest_Dense     *contents = (Nest_Dense*)ctx;
16052c5f739Sprj-   PetscInt       i;
16152c5f739Sprj-   PetscErrorCode ierr;
16252c5f739Sprj- 
16352c5f739Sprj-   PetscFunctionBegin;
16452c5f739Sprj-   ierr = PetscFree(contents->tarray);CHKERRQ(ierr);
16552c5f739Sprj-   for (i=0; i<contents->k; i++) {
16652c5f739Sprj-     ierr = MatDestroy(contents->workC + i);CHKERRQ(ierr);
16752c5f739Sprj-   }
16852c5f739Sprj-   ierr = PetscFree3(contents->dm,contents->dn,contents->workC);CHKERRQ(ierr);
16952c5f739Sprj-   ierr = PetscFree(contents);CHKERRQ(ierr);
17052c5f739Sprj-   PetscFunctionReturn(0);
17152c5f739Sprj- }
17252c5f739Sprj- 
1736718818eSStefano Zampini PETSC_INTERN PetscErrorCode MatProductSymbolic_Nest_Dense(Mat C)
17452c5f739Sprj- {
1756718818eSStefano Zampini   Mat_Nest          *bA;
1766718818eSStefano Zampini   Mat               viewB,workC;
17752c5f739Sprj-   const PetscScalar *barray;
1786718818eSStefano Zampini   PetscInt          i,j,M,N,m,n,nr,nc,maxm = 0,ldb;
1794222ddf1SHong Zhang   Nest_Dense        *contents=NULL;
1806718818eSStefano Zampini   PetscBool         cisdense;
18152c5f739Sprj-   PetscErrorCode    ierr;
1826718818eSStefano Zampini   Mat               A,B;
1836718818eSStefano Zampini   PetscReal         fill;
18452c5f739Sprj- 
18552c5f739Sprj-   PetscFunctionBegin;
1866718818eSStefano Zampini   MatCheckProduct(C,4);
1876718818eSStefano Zampini   if (C->product->data) SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Product data not empty");
1886718818eSStefano Zampini   A    = C->product->A;
1896718818eSStefano Zampini   B    = C->product->B;
1906718818eSStefano Zampini   fill = C->product->fill;
1916718818eSStefano Zampini   bA   = (Mat_Nest*)A->data;
1926718818eSStefano Zampini   nr   = bA->nr;
1936718818eSStefano Zampini   nc   = bA->nc;
1946718818eSStefano Zampini   ierr = MatGetLocalSize(B,NULL,&n);CHKERRQ(ierr);
19552c5f739Sprj-   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
19652c5f739Sprj-   ierr = MatGetLocalSize(A,&m,NULL);CHKERRQ(ierr);
19752c5f739Sprj-   ierr = MatGetSize(A,&M,NULL);CHKERRQ(ierr);
1986718818eSStefano Zampini   ierr = MatSetSizes(C,m,n,M,N);CHKERRQ(ierr);
1996718818eSStefano Zampini   ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATMPIDENSE,MATSEQDENSECUDA,MATMPIDENSECUDA,"");CHKERRQ(ierr);
2006718818eSStefano Zampini   if (!cisdense) {
2016718818eSStefano Zampini     ierr = MatSetType(C,((PetscObject)B)->type_name);CHKERRQ(ierr);
2026718818eSStefano Zampini   }
20318992e5dSStefano Zampini   ierr = MatSetUp(C);CHKERRQ(ierr);
2046718818eSStefano Zampini   if (!N) {
2056718818eSStefano Zampini     C->ops->productnumeric = MatProductNumeric_Nest_Dense;
2066718818eSStefano Zampini     PetscFunctionReturn(0);
20752c5f739Sprj-   }
20852c5f739Sprj- 
20952c5f739Sprj-   ierr = PetscNew(&contents);CHKERRQ(ierr);
2106718818eSStefano Zampini   C->product->data = contents;
2116718818eSStefano Zampini   C->product->destroy = MatNest_DenseDestroy;
21252c5f739Sprj-   ierr = PetscCalloc3(nr+1,&contents->dm,nc+1,&contents->dn,nr*nc,&contents->workC);CHKERRQ(ierr);
21352c5f739Sprj-   contents->k = nr*nc;
21452c5f739Sprj-   for (i=0; i<nr; i++) {
21552c5f739Sprj-     ierr = ISGetLocalSize(bA->isglobal.row[i],contents->dm + i+1);CHKERRQ(ierr);
21652c5f739Sprj-     maxm = PetscMax(maxm,contents->dm[i+1]);
21752c5f739Sprj-     contents->dm[i+1] += contents->dm[i];
21852c5f739Sprj-   }
21952c5f739Sprj-   for (i=0; i<nc; i++) {
22052c5f739Sprj-     ierr = ISGetLocalSize(bA->isglobal.col[i],contents->dn + i+1);CHKERRQ(ierr);
22152c5f739Sprj-     contents->dn[i+1] += contents->dn[i];
22252c5f739Sprj-   }
22352c5f739Sprj-   ierr = PetscMalloc1(maxm*N,&contents->tarray);CHKERRQ(ierr);
22452c5f739Sprj-   ierr = MatDenseGetLDA(B,&ldb);CHKERRQ(ierr);
22552c5f739Sprj-   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
22652c5f739Sprj-   ierr = MatDenseGetArrayRead(B,&barray);CHKERRQ(ierr);
22752c5f739Sprj-   /* loops are permuted compared to MatMatMultNumeric so that viewB is created only once per column of A */
22852c5f739Sprj-   for (j=0; j<nc; j++) {
22952c5f739Sprj-     ierr = ISGetSize(bA->isglobal.col[j],&M);CHKERRQ(ierr);
23052c5f739Sprj-     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB);CHKERRQ(ierr);
2316718818eSStefano Zampini     ierr = MatDenseSetLDA(viewB,ldb);CHKERRQ(ierr);
23252c5f739Sprj-     for (i=0; i<nr; i++) {
23352c5f739Sprj-       if (!bA->m[i][j]) continue;
23452c5f739Sprj-       /* MatMatMultSymbolic may attach a specific container (depending on MatType of bA->m[i][j]) to workC[i][j] */
2354222ddf1SHong Zhang 
2364222ddf1SHong Zhang       ierr = MatProductCreate(bA->m[i][j],viewB,NULL,&contents->workC[i*nc + j]);CHKERRQ(ierr);
2374222ddf1SHong Zhang       workC = contents->workC[i*nc + j];
2384222ddf1SHong Zhang       ierr = MatProductSetType(workC,MATPRODUCT_AB);CHKERRQ(ierr);
2394222ddf1SHong Zhang       ierr = MatProductSetAlgorithm(workC,"default");CHKERRQ(ierr);
2404222ddf1SHong Zhang       ierr = MatProductSetFill(workC,fill);CHKERRQ(ierr);
2414222ddf1SHong Zhang       ierr = MatProductSetFromOptions(workC);CHKERRQ(ierr);
2424222ddf1SHong Zhang       ierr = MatProductSymbolic(workC);CHKERRQ(ierr);
2434222ddf1SHong Zhang 
2446718818eSStefano Zampini       /* since tarray will be shared by all Mat */
2456718818eSStefano Zampini       ierr = MatSeqDenseSetPreallocation(workC,contents->tarray);CHKERRQ(ierr);
2466718818eSStefano Zampini       ierr = MatMPIDenseSetPreallocation(workC,contents->tarray);CHKERRQ(ierr);
24752c5f739Sprj-     }
24852c5f739Sprj-     ierr = MatDestroy(&viewB);CHKERRQ(ierr);
24952c5f739Sprj-   }
25052c5f739Sprj-   ierr = MatDenseRestoreArrayRead(B,&barray);CHKERRQ(ierr);
25152c5f739Sprj- 
2526718818eSStefano Zampini   C->ops->productnumeric = MatProductNumeric_Nest_Dense;
25352c5f739Sprj-   PetscFunctionReturn(0);
25452c5f739Sprj- }
25552c5f739Sprj- 
2564222ddf1SHong Zhang /* --------------------------------------------------------- */
2574222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_Nest_Dense_AB(Mat C)
2584222ddf1SHong Zhang {
2594222ddf1SHong Zhang   PetscFunctionBegin;
2606718818eSStefano Zampini   C->ops->productsymbolic = MatProductSymbolic_Nest_Dense;
2614222ddf1SHong Zhang   PetscFunctionReturn(0);
2624222ddf1SHong Zhang }
2634222ddf1SHong Zhang 
2644222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_Nest_Dense(Mat C)
26552c5f739Sprj- {
26652c5f739Sprj-   PetscErrorCode ierr;
2674222ddf1SHong Zhang   Mat_Product    *product = C->product;
26852c5f739Sprj- 
26952c5f739Sprj-   PetscFunctionBegin;
2704222ddf1SHong Zhang   if (product->type == MATPRODUCT_AB) {
2714222ddf1SHong Zhang     ierr = MatProductSetFromOptions_Nest_Dense_AB(C);CHKERRQ(ierr);
2726718818eSStefano Zampini   }
27352c5f739Sprj-   PetscFunctionReturn(0);
27452c5f739Sprj- }
2754222ddf1SHong Zhang /* --------------------------------------------------------- */
27652c5f739Sprj- 
277207556f9SJed Brown static PetscErrorCode MatMultTranspose_Nest(Mat A,Vec x,Vec y)
278d8588912SDave May {
279d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
280207556f9SJed Brown   Vec            *bx = bA->left,*by = bA->right;
281207556f9SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
282d8588912SDave May   PetscErrorCode ierr;
283d8588912SDave May 
284d8588912SDave May   PetscFunctionBegin;
285609e31cbSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
286609e31cbSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(y,bA->isglobal.col[i],&by[i]);CHKERRQ(ierr);}
287207556f9SJed Brown   for (j=0; j<nc; j++) {
288609e31cbSJed Brown     ierr = VecZeroEntries(by[j]);CHKERRQ(ierr);
289609e31cbSJed Brown     for (i=0; i<nr; i++) {
2906c75ac25SJed Brown       if (!bA->m[i][j]) continue;
291609e31cbSJed Brown       /* y[j] <- y[j] + (A[i][j])^T * x[i] */
292609e31cbSJed Brown       ierr = MatMultTransposeAdd(bA->m[i][j],bx[i],by[j],by[j]);CHKERRQ(ierr);
293d8588912SDave May     }
294d8588912SDave May   }
295609e31cbSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
296609e31cbSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(y,bA->isglobal.col[i],&by[i]);CHKERRQ(ierr);}
297d8588912SDave May   PetscFunctionReturn(0);
298d8588912SDave May }
299d8588912SDave May 
3009194d70fSJed Brown static PetscErrorCode MatMultTransposeAdd_Nest(Mat A,Vec x,Vec y,Vec z)
3019194d70fSJed Brown {
3029194d70fSJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
3039194d70fSJed Brown   Vec            *bx = bA->left,*bz = bA->right;
3049194d70fSJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
3059194d70fSJed Brown   PetscErrorCode ierr;
3069194d70fSJed Brown 
3079194d70fSJed Brown   PetscFunctionBegin;
3089194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
3099194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(z,bA->isglobal.col[i],&bz[i]);CHKERRQ(ierr);}
3109194d70fSJed Brown   for (j=0; j<nc; j++) {
3119194d70fSJed Brown     if (y != z) {
3129194d70fSJed Brown       Vec by;
3139194d70fSJed Brown       ierr = VecGetSubVector(y,bA->isglobal.col[j],&by);CHKERRQ(ierr);
3149194d70fSJed Brown       ierr = VecCopy(by,bz[j]);CHKERRQ(ierr);
3159194d70fSJed Brown       ierr = VecRestoreSubVector(y,bA->isglobal.col[j],&by);CHKERRQ(ierr);
3169194d70fSJed Brown     }
3179194d70fSJed Brown     for (i=0; i<nr; i++) {
3186c75ac25SJed Brown       if (!bA->m[i][j]) continue;
3199194d70fSJed Brown       /* z[j] <- y[j] + (A[i][j])^T * x[i] */
3209194d70fSJed Brown       ierr = MatMultTransposeAdd(bA->m[i][j],bx[i],bz[j],bz[j]);CHKERRQ(ierr);
3219194d70fSJed Brown     }
3229194d70fSJed Brown   }
3239194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
3249194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(z,bA->isglobal.col[i],&bz[i]);CHKERRQ(ierr);}
3259194d70fSJed Brown   PetscFunctionReturn(0);
3269194d70fSJed Brown }
3279194d70fSJed Brown 
328f8170845SAlex Fikl static PetscErrorCode MatTranspose_Nest(Mat A,MatReuse reuse,Mat *B)
329f8170845SAlex Fikl {
330f8170845SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data, *bC;
331f8170845SAlex Fikl   Mat            C;
332f8170845SAlex Fikl   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
333f8170845SAlex Fikl   PetscErrorCode ierr;
334f8170845SAlex Fikl 
335f8170845SAlex Fikl   PetscFunctionBegin;
336cf37664fSBarry Smith   if (reuse == MAT_INPLACE_MATRIX && nr != nc) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_SIZ,"Square nested matrix only for in-place");
337f8170845SAlex Fikl 
338cf37664fSBarry Smith   if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_INPLACE_MATRIX) {
339f8170845SAlex Fikl     Mat *subs;
340f8170845SAlex Fikl     IS  *is_row,*is_col;
341f8170845SAlex Fikl 
342f8170845SAlex Fikl     ierr = PetscCalloc1(nr * nc,&subs);CHKERRQ(ierr);
343f8170845SAlex Fikl     ierr = PetscMalloc2(nr,&is_row,nc,&is_col);CHKERRQ(ierr);
344f8170845SAlex Fikl     ierr = MatNestGetISs(A,is_row,is_col);CHKERRQ(ierr);
345cf37664fSBarry Smith     if (reuse == MAT_INPLACE_MATRIX) {
346ddeb9bd8SAlex Fikl       for (i=0; i<nr; i++) {
347ddeb9bd8SAlex Fikl         for (j=0; j<nc; j++) {
348ddeb9bd8SAlex Fikl           subs[i + nr * j] = bA->m[i][j];
349ddeb9bd8SAlex Fikl         }
350ddeb9bd8SAlex Fikl       }
351ddeb9bd8SAlex Fikl     }
352ddeb9bd8SAlex Fikl 
353f8170845SAlex Fikl     ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nc,is_col,nr,is_row,subs,&C);CHKERRQ(ierr);
354f8170845SAlex Fikl     ierr = PetscFree(subs);CHKERRQ(ierr);
3553d994f23SBarry Smith     ierr = PetscFree2(is_row,is_col);CHKERRQ(ierr);
356f8170845SAlex Fikl   } else {
357f8170845SAlex Fikl     C = *B;
358f8170845SAlex Fikl   }
359f8170845SAlex Fikl 
360f8170845SAlex Fikl   bC = (Mat_Nest*)C->data;
361f8170845SAlex Fikl   for (i=0; i<nr; i++) {
362f8170845SAlex Fikl     for (j=0; j<nc; j++) {
363f8170845SAlex Fikl       if (bA->m[i][j]) {
364f8170845SAlex Fikl         ierr = MatTranspose(bA->m[i][j], reuse, &(bC->m[j][i]));CHKERRQ(ierr);
365f8170845SAlex Fikl       } else {
366f8170845SAlex Fikl         bC->m[j][i] = NULL;
367f8170845SAlex Fikl       }
368f8170845SAlex Fikl     }
369f8170845SAlex Fikl   }
370f8170845SAlex Fikl 
371cf37664fSBarry Smith   if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) {
372f8170845SAlex Fikl     *B = C;
373f8170845SAlex Fikl   } else {
374f8170845SAlex Fikl     ierr = MatHeaderMerge(A, &C);CHKERRQ(ierr);
375f8170845SAlex Fikl   }
376f8170845SAlex Fikl   PetscFunctionReturn(0);
377f8170845SAlex Fikl }
378f8170845SAlex Fikl 
379e2d7f03fSJed Brown static PetscErrorCode MatNestDestroyISList(PetscInt n,IS **list)
380e2d7f03fSJed Brown {
381e2d7f03fSJed Brown   PetscErrorCode ierr;
382e2d7f03fSJed Brown   IS             *lst = *list;
383e2d7f03fSJed Brown   PetscInt       i;
384e2d7f03fSJed Brown 
385e2d7f03fSJed Brown   PetscFunctionBegin;
386e2d7f03fSJed Brown   if (!lst) PetscFunctionReturn(0);
3876bf464f9SBarry Smith   for (i=0; i<n; i++) if (lst[i]) {ierr = ISDestroy(&lst[i]);CHKERRQ(ierr);}
388e2d7f03fSJed Brown   ierr  = PetscFree(lst);CHKERRQ(ierr);
3890298fd71SBarry Smith   *list = NULL;
390e2d7f03fSJed Brown   PetscFunctionReturn(0);
391e2d7f03fSJed Brown }
392e2d7f03fSJed Brown 
39306a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat A)
394d8588912SDave May {
395d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
396d8588912SDave May   PetscInt       i,j;
397d8588912SDave May   PetscErrorCode ierr;
398d8588912SDave May 
399d8588912SDave May   PetscFunctionBegin;
400d8588912SDave May   /* release the matrices and the place holders */
401e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nr,&vs->isglobal.row);CHKERRQ(ierr);
402e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nc,&vs->isglobal.col);CHKERRQ(ierr);
403e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nr,&vs->islocal.row);CHKERRQ(ierr);
404e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nc,&vs->islocal.col);CHKERRQ(ierr);
405d8588912SDave May 
406d8588912SDave May   ierr = PetscFree(vs->row_len);CHKERRQ(ierr);
407d8588912SDave May   ierr = PetscFree(vs->col_len);CHKERRQ(ierr);
40806a1af2fSStefano Zampini   ierr = PetscFree(vs->nnzstate);CHKERRQ(ierr);
409d8588912SDave May 
410207556f9SJed Brown   ierr = PetscFree2(vs->left,vs->right);CHKERRQ(ierr);
411207556f9SJed Brown 
412d8588912SDave May   /* release the matrices and the place holders */
413d8588912SDave May   if (vs->m) {
414d8588912SDave May     for (i=0; i<vs->nr; i++) {
415d8588912SDave May       for (j=0; j<vs->nc; j++) {
4166bf464f9SBarry Smith         ierr = MatDestroy(&vs->m[i][j]);CHKERRQ(ierr);
417d8588912SDave May       }
418d8588912SDave May       ierr = PetscFree(vs->m[i]);CHKERRQ(ierr);
419d8588912SDave May     }
420d8588912SDave May     ierr = PetscFree(vs->m);CHKERRQ(ierr);
421d8588912SDave May   }
42206a1af2fSStefano Zampini 
42306a1af2fSStefano Zampini   /* restore defaults */
42406a1af2fSStefano Zampini   vs->nr = 0;
42506a1af2fSStefano Zampini   vs->nc = 0;
42606a1af2fSStefano Zampini   vs->splitassembly = PETSC_FALSE;
42706a1af2fSStefano Zampini   PetscFunctionReturn(0);
42806a1af2fSStefano Zampini }
42906a1af2fSStefano Zampini 
43006a1af2fSStefano Zampini static PetscErrorCode MatDestroy_Nest(Mat A)
43106a1af2fSStefano Zampini {
43206a1af2fSStefano Zampini   PetscErrorCode ierr;
43306a1af2fSStefano Zampini 
43406a1af2fSStefano Zampini   ierr = MatReset_Nest(A);CHKERRQ(ierr);
435bf0cc555SLisandro Dalcin   ierr = PetscFree(A->data);CHKERRQ(ierr);
436d8588912SDave May 
437bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",0);CHKERRQ(ierr);
438bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",0);CHKERRQ(ierr);
439bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",0);CHKERRQ(ierr);
440bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",0);CHKERRQ(ierr);
441bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",0);CHKERRQ(ierr);
442bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",0);CHKERRQ(ierr);
443bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",0);CHKERRQ(ierr);
444bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",0);CHKERRQ(ierr);
4450899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",0);CHKERRQ(ierr);
4460899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",0);CHKERRQ(ierr);
4475e3038f0Sstefano_zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",0);CHKERRQ(ierr);
4485e3038f0Sstefano_zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",0);CHKERRQ(ierr);
4494222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_seqdense_C",NULL);CHKERRQ(ierr);
4504222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_mpidense_C",NULL);CHKERRQ(ierr);
4514222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_dense_C",NULL);CHKERRQ(ierr);
452d8588912SDave May   PetscFunctionReturn(0);
453d8588912SDave May }
454d8588912SDave May 
455381b8e50SStefano Zampini static PetscErrorCode MatMissingDiagonal_Nest(Mat mat,PetscBool *missing,PetscInt *dd)
456381b8e50SStefano Zampini {
457381b8e50SStefano Zampini   Mat_Nest       *vs = (Mat_Nest*)mat->data;
458381b8e50SStefano Zampini   PetscInt       i;
459381b8e50SStefano Zampini   PetscErrorCode ierr;
460381b8e50SStefano Zampini 
461381b8e50SStefano Zampini   PetscFunctionBegin;
462381b8e50SStefano Zampini   if (dd) *dd = 0;
463381b8e50SStefano Zampini   if (!vs->nr) {
464381b8e50SStefano Zampini     *missing = PETSC_TRUE;
465381b8e50SStefano Zampini     PetscFunctionReturn(0);
466381b8e50SStefano Zampini   }
467381b8e50SStefano Zampini   *missing = PETSC_FALSE;
468381b8e50SStefano Zampini   for (i = 0; i < vs->nr && !(*missing); i++) {
469381b8e50SStefano Zampini     *missing = PETSC_TRUE;
470381b8e50SStefano Zampini     if (vs->m[i][i]) {
471381b8e50SStefano Zampini       ierr = MatMissingDiagonal(vs->m[i][i],missing,NULL);CHKERRQ(ierr);
472381b8e50SStefano Zampini       if (*missing && dd) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"First missing entry not yet implemented");
473381b8e50SStefano Zampini     }
474381b8e50SStefano Zampini   }
475381b8e50SStefano Zampini   PetscFunctionReturn(0);
476381b8e50SStefano Zampini }
477381b8e50SStefano Zampini 
478207556f9SJed Brown static PetscErrorCode MatAssemblyBegin_Nest(Mat A,MatAssemblyType type)
479d8588912SDave May {
480d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
481d8588912SDave May   PetscInt       i,j;
482d8588912SDave May   PetscErrorCode ierr;
48306a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
484d8588912SDave May 
485d8588912SDave May   PetscFunctionBegin;
486d8588912SDave May   for (i=0; i<vs->nr; i++) {
487d8588912SDave May     for (j=0; j<vs->nc; j++) {
48806a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
489e7c19651SJed Brown       if (vs->m[i][j]) {
490e7c19651SJed Brown         ierr = MatAssemblyBegin(vs->m[i][j],type);CHKERRQ(ierr);
491e7c19651SJed Brown         if (!vs->splitassembly) {
492e7c19651SJed Brown           /* Note: split assembly will fail if the same block appears more than once (even indirectly through a nested
493e7c19651SJed Brown            * sub-block). This could be fixed by adding a flag to Mat so that there was a way to check if a Mat was
494e7c19651SJed Brown            * already performing an assembly, but the result would by more complicated and appears to offer less
495e7c19651SJed Brown            * potential for diagnostics and correctness checking. Split assembly should be fixed once there is an
496e7c19651SJed Brown            * interface for libraries to make asynchronous progress in "user-defined non-blocking collectives".
497e7c19651SJed Brown            */
498e7c19651SJed Brown           ierr = MatAssemblyEnd(vs->m[i][j],type);CHKERRQ(ierr);
49906a1af2fSStefano Zampini           ierr = MatGetNonzeroState(vs->m[i][j],&subnnzstate);CHKERRQ(ierr);
500e7c19651SJed Brown         }
501e7c19651SJed Brown       }
50206a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || vs->nnzstate[i*vs->nc+j] != subnnzstate);
50306a1af2fSStefano Zampini       vs->nnzstate[i*vs->nc+j] = subnnzstate;
504d8588912SDave May     }
505d8588912SDave May   }
50606a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
507d8588912SDave May   PetscFunctionReturn(0);
508d8588912SDave May }
509d8588912SDave May 
510207556f9SJed Brown static PetscErrorCode MatAssemblyEnd_Nest(Mat A, MatAssemblyType type)
511d8588912SDave May {
512d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
513d8588912SDave May   PetscInt       i,j;
514d8588912SDave May   PetscErrorCode ierr;
515d8588912SDave May 
516d8588912SDave May   PetscFunctionBegin;
517d8588912SDave May   for (i=0; i<vs->nr; i++) {
518d8588912SDave May     for (j=0; j<vs->nc; j++) {
519e7c19651SJed Brown       if (vs->m[i][j]) {
520e7c19651SJed Brown         if (vs->splitassembly) {
521e7c19651SJed Brown           ierr = MatAssemblyEnd(vs->m[i][j],type);CHKERRQ(ierr);
522e7c19651SJed Brown         }
523e7c19651SJed Brown       }
524d8588912SDave May     }
525d8588912SDave May   }
526d8588912SDave May   PetscFunctionReturn(0);
527d8588912SDave May }
528d8588912SDave May 
529f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatRow(Mat A,PetscInt row,Mat *B)
530d8588912SDave May {
531207556f9SJed Brown   PetscErrorCode ierr;
532f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
533f349c1fdSJed Brown   PetscInt       j;
534f349c1fdSJed Brown   Mat            sub;
535d8588912SDave May 
536d8588912SDave May   PetscFunctionBegin;
5370298fd71SBarry Smith   sub = (row < vs->nc) ? vs->m[row][row] : (Mat)NULL; /* Prefer to find on the diagonal */
538f349c1fdSJed Brown   for (j=0; !sub && j<vs->nc; j++) sub = vs->m[row][j];
5394994cf47SJed Brown   if (sub) {ierr = MatSetUp(sub);CHKERRQ(ierr);}       /* Ensure that the sizes are available */
540f349c1fdSJed Brown   *B = sub;
541f349c1fdSJed Brown   PetscFunctionReturn(0);
542d8588912SDave May }
543d8588912SDave May 
544f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatCol(Mat A,PetscInt col,Mat *B)
545f349c1fdSJed Brown {
546207556f9SJed Brown   PetscErrorCode ierr;
547f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
548f349c1fdSJed Brown   PetscInt       i;
549f349c1fdSJed Brown   Mat            sub;
550f349c1fdSJed Brown 
551f349c1fdSJed Brown   PetscFunctionBegin;
5520298fd71SBarry Smith   sub = (col < vs->nr) ? vs->m[col][col] : (Mat)NULL; /* Prefer to find on the diagonal */
553f349c1fdSJed Brown   for (i=0; !sub && i<vs->nr; i++) sub = vs->m[i][col];
5544994cf47SJed Brown   if (sub) {ierr = MatSetUp(sub);CHKERRQ(ierr);}       /* Ensure that the sizes are available */
555f349c1fdSJed Brown   *B = sub;
556f349c1fdSJed Brown   PetscFunctionReturn(0);
557d8588912SDave May }
558d8588912SDave May 
559f349c1fdSJed Brown static PetscErrorCode MatNestFindIS(Mat A,PetscInt n,const IS list[],IS is,PetscInt *found)
560f349c1fdSJed Brown {
561f349c1fdSJed Brown   PetscErrorCode ierr;
562f349c1fdSJed Brown   PetscInt       i;
563f349c1fdSJed Brown   PetscBool      flg;
564f349c1fdSJed Brown 
565f349c1fdSJed Brown   PetscFunctionBegin;
566f349c1fdSJed Brown   PetscValidPointer(list,3);
567f349c1fdSJed Brown   PetscValidHeaderSpecific(is,IS_CLASSID,4);
568f349c1fdSJed Brown   PetscValidIntPointer(found,5);
569f349c1fdSJed Brown   *found = -1;
570f349c1fdSJed Brown   for (i=0; i<n; i++) {
571207556f9SJed Brown     if (!list[i]) continue;
572320466b0SStefano Zampini     ierr = ISEqualUnsorted(list[i],is,&flg);CHKERRQ(ierr);
573f349c1fdSJed Brown     if (flg) {
574f349c1fdSJed Brown       *found = i;
575f349c1fdSJed Brown       PetscFunctionReturn(0);
576f349c1fdSJed Brown     }
577f349c1fdSJed Brown   }
578ce94432eSBarry Smith   SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Could not find index set");
579f349c1fdSJed Brown   PetscFunctionReturn(0);
580f349c1fdSJed Brown }
581f349c1fdSJed Brown 
5828188e55aSJed Brown /* Get a block row as a new MatNest */
5838188e55aSJed Brown static PetscErrorCode MatNestGetRow(Mat A,PetscInt row,Mat *B)
5848188e55aSJed Brown {
5858188e55aSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
5868188e55aSJed Brown   char           keyname[256];
5878188e55aSJed Brown   PetscErrorCode ierr;
5888188e55aSJed Brown 
5898188e55aSJed Brown   PetscFunctionBegin;
5900298fd71SBarry Smith   *B   = NULL;
5918caf3d72SBarry Smith   ierr = PetscSNPrintf(keyname,sizeof(keyname),"NestRow_%D",row);CHKERRQ(ierr);
5928188e55aSJed Brown   ierr = PetscObjectQuery((PetscObject)A,keyname,(PetscObject*)B);CHKERRQ(ierr);
5938188e55aSJed Brown   if (*B) PetscFunctionReturn(0);
5948188e55aSJed Brown 
595ce94432eSBarry Smith   ierr = MatCreateNest(PetscObjectComm((PetscObject)A),1,NULL,vs->nc,vs->isglobal.col,vs->m[row],B);CHKERRQ(ierr);
59626fbe8dcSKarl Rupp 
5978188e55aSJed Brown   (*B)->assembled = A->assembled;
59826fbe8dcSKarl Rupp 
5998188e55aSJed Brown   ierr = PetscObjectCompose((PetscObject)A,keyname,(PetscObject)*B);CHKERRQ(ierr);
6008188e55aSJed Brown   ierr = PetscObjectDereference((PetscObject)*B);CHKERRQ(ierr); /* Leave the only remaining reference in the composition */
6018188e55aSJed Brown   PetscFunctionReturn(0);
6028188e55aSJed Brown }
6038188e55aSJed Brown 
604f349c1fdSJed Brown static PetscErrorCode MatNestFindSubMat(Mat A,struct MatNestISPair *is,IS isrow,IS iscol,Mat *B)
605f349c1fdSJed Brown {
606f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
6078188e55aSJed Brown   PetscErrorCode ierr;
6086b3a5b13SJed Brown   PetscInt       row,col;
609e072481dSJed Brown   PetscBool      same,isFullCol,isFullColGlobal;
610f349c1fdSJed Brown 
611f349c1fdSJed Brown   PetscFunctionBegin;
6128188e55aSJed Brown   /* Check if full column space. This is a hack */
6138188e55aSJed Brown   isFullCol = PETSC_FALSE;
614251f4c67SDmitry Karpeev   ierr      = PetscObjectTypeCompare((PetscObject)iscol,ISSTRIDE,&same);CHKERRQ(ierr);
6158188e55aSJed Brown   if (same) {
61677019fcaSJed Brown     PetscInt n,first,step,i,an,am,afirst,astep;
6178188e55aSJed Brown     ierr      = ISStrideGetInfo(iscol,&first,&step);CHKERRQ(ierr);
6188188e55aSJed Brown     ierr      = ISGetLocalSize(iscol,&n);CHKERRQ(ierr);
61977019fcaSJed Brown     isFullCol = PETSC_TRUE;
62005ce4453SJed Brown     for (i=0,an=A->cmap->rstart; i<vs->nc; i++) {
62106a1af2fSStefano Zampini       ierr = PetscObjectTypeCompare((PetscObject)is->col[i],ISSTRIDE,&same);CHKERRQ(ierr);
62277019fcaSJed Brown       ierr = ISGetLocalSize(is->col[i],&am);CHKERRQ(ierr);
62306a1af2fSStefano Zampini       if (same) {
62406a1af2fSStefano Zampini         ierr = ISStrideGetInfo(is->col[i],&afirst,&astep);CHKERRQ(ierr);
62577019fcaSJed Brown         if (afirst != an || astep != step) isFullCol = PETSC_FALSE;
62606a1af2fSStefano Zampini       } else isFullCol = PETSC_FALSE;
62777019fcaSJed Brown       an += am;
62877019fcaSJed Brown     }
62905ce4453SJed Brown     if (an != A->cmap->rstart+n) isFullCol = PETSC_FALSE;
6308188e55aSJed Brown   }
631b2566f29SBarry Smith   ierr = MPIU_Allreduce(&isFullCol,&isFullColGlobal,1,MPIU_BOOL,MPI_LAND,PetscObjectComm((PetscObject)iscol));CHKERRQ(ierr);
6328188e55aSJed Brown 
633427230ceSLisandro Dalcin   if (isFullColGlobal && vs->nc > 1) {
6348188e55aSJed Brown     PetscInt row;
6358188e55aSJed Brown     ierr = MatNestFindIS(A,vs->nr,is->row,isrow,&row);CHKERRQ(ierr);
6368188e55aSJed Brown     ierr = MatNestGetRow(A,row,B);CHKERRQ(ierr);
6378188e55aSJed Brown   } else {
638f349c1fdSJed Brown     ierr = MatNestFindIS(A,vs->nr,is->row,isrow,&row);CHKERRQ(ierr);
639f349c1fdSJed Brown     ierr = MatNestFindIS(A,vs->nc,is->col,iscol,&col);CHKERRQ(ierr);
640b6480e04SStefano Zampini     if (!vs->m[row][col]) {
641b6480e04SStefano Zampini       PetscInt lr,lc;
642b6480e04SStefano Zampini 
643b6480e04SStefano Zampini       ierr = MatCreate(PetscObjectComm((PetscObject)A),&vs->m[row][col]);CHKERRQ(ierr);
644b6480e04SStefano Zampini       ierr = ISGetLocalSize(vs->isglobal.row[row],&lr);CHKERRQ(ierr);
645b6480e04SStefano Zampini       ierr = ISGetLocalSize(vs->isglobal.col[col],&lc);CHKERRQ(ierr);
646b6480e04SStefano Zampini       ierr = MatSetSizes(vs->m[row][col],lr,lc,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr);
647fa9f0909SStefano Zampini       ierr = MatSetType(vs->m[row][col],MATAIJ);CHKERRQ(ierr);
648fa9f0909SStefano Zampini       ierr = MatSeqAIJSetPreallocation(vs->m[row][col],0,NULL);CHKERRQ(ierr);
649fa9f0909SStefano Zampini       ierr = MatMPIAIJSetPreallocation(vs->m[row][col],0,NULL,0,NULL);CHKERRQ(ierr);
650b6480e04SStefano Zampini       ierr = MatSetUp(vs->m[row][col]);CHKERRQ(ierr);
651b6480e04SStefano Zampini       ierr = MatAssemblyBegin(vs->m[row][col],MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
652b6480e04SStefano Zampini       ierr = MatAssemblyEnd(vs->m[row][col],MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
653b6480e04SStefano Zampini     }
654f349c1fdSJed Brown     *B = vs->m[row][col];
6558188e55aSJed Brown   }
656f349c1fdSJed Brown   PetscFunctionReturn(0);
657f349c1fdSJed Brown }
658f349c1fdSJed Brown 
65906a1af2fSStefano Zampini /*
66006a1af2fSStefano Zampini    TODO: This does not actually returns a submatrix we can modify
66106a1af2fSStefano Zampini */
6627dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrix_Nest(Mat A,IS isrow,IS iscol,MatReuse reuse,Mat *B)
663f349c1fdSJed Brown {
664f349c1fdSJed Brown   PetscErrorCode ierr;
665f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
666f349c1fdSJed Brown   Mat            sub;
667f349c1fdSJed Brown 
668f349c1fdSJed Brown   PetscFunctionBegin;
669f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->isglobal,isrow,iscol,&sub);CHKERRQ(ierr);
670f349c1fdSJed Brown   switch (reuse) {
671f349c1fdSJed Brown   case MAT_INITIAL_MATRIX:
6727874fa86SDave May     if (sub) { ierr = PetscObjectReference((PetscObject)sub);CHKERRQ(ierr); }
673f349c1fdSJed Brown     *B = sub;
674f349c1fdSJed Brown     break;
675f349c1fdSJed Brown   case MAT_REUSE_MATRIX:
676ce94432eSBarry Smith     if (sub != *B) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Submatrix was not used before in this call");
677f349c1fdSJed Brown     break;
678f349c1fdSJed Brown   case MAT_IGNORE_MATRIX:       /* Nothing to do */
679f349c1fdSJed Brown     break;
680511c6705SHong Zhang   case MAT_INPLACE_MATRIX:       /* Nothing to do */
681511c6705SHong Zhang     SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MAT_INPLACE_MATRIX is not supported yet");
682511c6705SHong Zhang     break;
683f349c1fdSJed Brown   }
684f349c1fdSJed Brown   PetscFunctionReturn(0);
685f349c1fdSJed Brown }
686f349c1fdSJed Brown 
687f349c1fdSJed Brown PetscErrorCode MatGetLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B)
688f349c1fdSJed Brown {
689f349c1fdSJed Brown   PetscErrorCode ierr;
690f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
691f349c1fdSJed Brown   Mat            sub;
692f349c1fdSJed Brown 
693f349c1fdSJed Brown   PetscFunctionBegin;
694f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub);CHKERRQ(ierr);
695f349c1fdSJed Brown   /* We allow the submatrix to be NULL, perhaps it would be better for the user to return an empty matrix instead */
696f349c1fdSJed Brown   if (sub) {ierr = PetscObjectReference((PetscObject)sub);CHKERRQ(ierr);}
697f349c1fdSJed Brown   *B = sub;
698d8588912SDave May   PetscFunctionReturn(0);
699d8588912SDave May }
700d8588912SDave May 
701207556f9SJed Brown static PetscErrorCode MatRestoreLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B)
702d8588912SDave May {
703d8588912SDave May   PetscErrorCode ierr;
704f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
705f349c1fdSJed Brown   Mat            sub;
706d8588912SDave May 
707d8588912SDave May   PetscFunctionBegin;
708f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub);CHKERRQ(ierr);
709ce94432eSBarry Smith   if (*B != sub) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has not been gotten");
710f349c1fdSJed Brown   if (sub) {
711ce94432eSBarry Smith     if (((PetscObject)sub)->refct <= 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has had reference count decremented too many times");
7126bf464f9SBarry Smith     ierr = MatDestroy(B);CHKERRQ(ierr);
713d8588912SDave May   }
714d8588912SDave May   PetscFunctionReturn(0);
715d8588912SDave May }
716d8588912SDave May 
7177874fa86SDave May static PetscErrorCode MatGetDiagonal_Nest(Mat A,Vec v)
7187874fa86SDave May {
7197874fa86SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
7207874fa86SDave May   PetscInt       i;
7217874fa86SDave May   PetscErrorCode ierr;
7227874fa86SDave May 
7237874fa86SDave May   PetscFunctionBegin;
7247874fa86SDave May   for (i=0; i<bA->nr; i++) {
725429bac76SJed Brown     Vec bv;
726429bac76SJed Brown     ierr = VecGetSubVector(v,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
7277874fa86SDave May     if (bA->m[i][i]) {
728429bac76SJed Brown       ierr = MatGetDiagonal(bA->m[i][i],bv);CHKERRQ(ierr);
7297874fa86SDave May     } else {
7305159a857SMatthew G. Knepley       ierr = VecSet(bv,0.0);CHKERRQ(ierr);
7317874fa86SDave May     }
732429bac76SJed Brown     ierr = VecRestoreSubVector(v,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
7337874fa86SDave May   }
7347874fa86SDave May   PetscFunctionReturn(0);
7357874fa86SDave May }
7367874fa86SDave May 
7377874fa86SDave May static PetscErrorCode MatDiagonalScale_Nest(Mat A,Vec l,Vec r)
7387874fa86SDave May {
7397874fa86SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
740429bac76SJed Brown   Vec            bl,*br;
7417874fa86SDave May   PetscInt       i,j;
7427874fa86SDave May   PetscErrorCode ierr;
7437874fa86SDave May 
7447874fa86SDave May   PetscFunctionBegin;
7453f800ebeSJed Brown   ierr = PetscCalloc1(bA->nc,&br);CHKERRQ(ierr);
7462e6472ebSElliott Sales de Andrade   if (r) {
747429bac76SJed Brown     for (j=0; j<bA->nc; j++) {ierr = VecGetSubVector(r,bA->isglobal.col[j],&br[j]);CHKERRQ(ierr);}
7482e6472ebSElliott Sales de Andrade   }
7492e6472ebSElliott Sales de Andrade   bl = NULL;
7507874fa86SDave May   for (i=0; i<bA->nr; i++) {
7512e6472ebSElliott Sales de Andrade     if (l) {
752429bac76SJed Brown       ierr = VecGetSubVector(l,bA->isglobal.row[i],&bl);CHKERRQ(ierr);
7532e6472ebSElliott Sales de Andrade     }
7547874fa86SDave May     for (j=0; j<bA->nc; j++) {
7557874fa86SDave May       if (bA->m[i][j]) {
756429bac76SJed Brown         ierr = MatDiagonalScale(bA->m[i][j],bl,br[j]);CHKERRQ(ierr);
7577874fa86SDave May       }
7587874fa86SDave May     }
7592e6472ebSElliott Sales de Andrade     if (l) {
760a061e289SJed Brown       ierr = VecRestoreSubVector(l,bA->isglobal.row[i],&bl);CHKERRQ(ierr);
7617874fa86SDave May     }
7622e6472ebSElliott Sales de Andrade   }
7632e6472ebSElliott Sales de Andrade   if (r) {
764429bac76SJed Brown     for (j=0; j<bA->nc; j++) {ierr = VecRestoreSubVector(r,bA->isglobal.col[j],&br[j]);CHKERRQ(ierr);}
7652e6472ebSElliott Sales de Andrade   }
766429bac76SJed Brown   ierr = PetscFree(br);CHKERRQ(ierr);
7677874fa86SDave May   PetscFunctionReturn(0);
7687874fa86SDave May }
7697874fa86SDave May 
770a061e289SJed Brown static PetscErrorCode MatScale_Nest(Mat A,PetscScalar a)
771a061e289SJed Brown {
772a061e289SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
773a061e289SJed Brown   PetscInt       i,j;
774a061e289SJed Brown   PetscErrorCode ierr;
775a061e289SJed Brown 
776a061e289SJed Brown   PetscFunctionBegin;
777a061e289SJed Brown   for (i=0; i<bA->nr; i++) {
778a061e289SJed Brown     for (j=0; j<bA->nc; j++) {
779a061e289SJed Brown       if (bA->m[i][j]) {
780a061e289SJed Brown         ierr = MatScale(bA->m[i][j],a);CHKERRQ(ierr);
781a061e289SJed Brown       }
782a061e289SJed Brown     }
783a061e289SJed Brown   }
784a061e289SJed Brown   PetscFunctionReturn(0);
785a061e289SJed Brown }
786a061e289SJed Brown 
787a061e289SJed Brown static PetscErrorCode MatShift_Nest(Mat A,PetscScalar a)
788a061e289SJed Brown {
789a061e289SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
790a061e289SJed Brown   PetscInt       i;
791a061e289SJed Brown   PetscErrorCode ierr;
79206a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
793a061e289SJed Brown 
794a061e289SJed Brown   PetscFunctionBegin;
795a061e289SJed Brown   for (i=0; i<bA->nr; i++) {
79606a1af2fSStefano Zampini     PetscObjectState subnnzstate = 0;
797ce94432eSBarry Smith     if (!bA->m[i][i]) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"No support for shifting an empty diagonal block, insert a matrix in block (%D,%D)",i,i);
798a061e289SJed Brown     ierr = MatShift(bA->m[i][i],a);CHKERRQ(ierr);
79906a1af2fSStefano Zampini     ierr = MatGetNonzeroState(bA->m[i][i],&subnnzstate);CHKERRQ(ierr);
80006a1af2fSStefano Zampini     nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i*bA->nc+i] != subnnzstate);
80106a1af2fSStefano Zampini     bA->nnzstate[i*bA->nc+i] = subnnzstate;
802a061e289SJed Brown   }
80306a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
804a061e289SJed Brown   PetscFunctionReturn(0);
805a061e289SJed Brown }
806a061e289SJed Brown 
80713135bc6SAlex Fikl static PetscErrorCode MatDiagonalSet_Nest(Mat A,Vec D,InsertMode is)
80813135bc6SAlex Fikl {
80913135bc6SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data;
81013135bc6SAlex Fikl   PetscInt       i;
81113135bc6SAlex Fikl   PetscErrorCode ierr;
81206a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
81313135bc6SAlex Fikl 
81413135bc6SAlex Fikl   PetscFunctionBegin;
81513135bc6SAlex Fikl   for (i=0; i<bA->nr; i++) {
81606a1af2fSStefano Zampini     PetscObjectState subnnzstate = 0;
81713135bc6SAlex Fikl     Vec              bv;
81813135bc6SAlex Fikl     ierr = VecGetSubVector(D,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
81913135bc6SAlex Fikl     if (bA->m[i][i]) {
82013135bc6SAlex Fikl       ierr = MatDiagonalSet(bA->m[i][i],bv,is);CHKERRQ(ierr);
82106a1af2fSStefano Zampini       ierr = MatGetNonzeroState(bA->m[i][i],&subnnzstate);CHKERRQ(ierr);
82213135bc6SAlex Fikl     }
82313135bc6SAlex Fikl     ierr = VecRestoreSubVector(D,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
82406a1af2fSStefano Zampini     nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i*bA->nc+i] != subnnzstate);
82506a1af2fSStefano Zampini     bA->nnzstate[i*bA->nc+i] = subnnzstate;
82613135bc6SAlex Fikl   }
82706a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
82813135bc6SAlex Fikl   PetscFunctionReturn(0);
82913135bc6SAlex Fikl }
83013135bc6SAlex Fikl 
831f8170845SAlex Fikl static PetscErrorCode MatSetRandom_Nest(Mat A,PetscRandom rctx)
832f8170845SAlex Fikl {
833f8170845SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data;
834f8170845SAlex Fikl   PetscInt       i,j;
835f8170845SAlex Fikl   PetscErrorCode ierr;
836f8170845SAlex Fikl 
837f8170845SAlex Fikl   PetscFunctionBegin;
838f8170845SAlex Fikl   for (i=0; i<bA->nr; i++) {
839f8170845SAlex Fikl     for (j=0; j<bA->nc; j++) {
840f8170845SAlex Fikl       if (bA->m[i][j]) {
841f8170845SAlex Fikl         ierr = MatSetRandom(bA->m[i][j],rctx);CHKERRQ(ierr);
842f8170845SAlex Fikl       }
843f8170845SAlex Fikl     }
844f8170845SAlex Fikl   }
845f8170845SAlex Fikl   PetscFunctionReturn(0);
846f8170845SAlex Fikl }
847f8170845SAlex Fikl 
8482a7a6963SBarry Smith static PetscErrorCode MatCreateVecs_Nest(Mat A,Vec *right,Vec *left)
849d8588912SDave May {
850d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
851d8588912SDave May   Vec            *L,*R;
852d8588912SDave May   MPI_Comm       comm;
853d8588912SDave May   PetscInt       i,j;
854d8588912SDave May   PetscErrorCode ierr;
855d8588912SDave May 
856d8588912SDave May   PetscFunctionBegin;
857ce94432eSBarry Smith   ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr);
858d8588912SDave May   if (right) {
859d8588912SDave May     /* allocate R */
860854ce69bSBarry Smith     ierr = PetscMalloc1(bA->nc, &R);CHKERRQ(ierr);
861d8588912SDave May     /* Create the right vectors */
862d8588912SDave May     for (j=0; j<bA->nc; j++) {
863d8588912SDave May       for (i=0; i<bA->nr; i++) {
864d8588912SDave May         if (bA->m[i][j]) {
8652a7a6963SBarry Smith           ierr = MatCreateVecs(bA->m[i][j],&R[j],NULL);CHKERRQ(ierr);
866d8588912SDave May           break;
867d8588912SDave May         }
868d8588912SDave May       }
8696c4ed002SBarry Smith       if (i==bA->nr) SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null column.");
870d8588912SDave May     }
871f349c1fdSJed Brown     ierr = VecCreateNest(comm,bA->nc,bA->isglobal.col,R,right);CHKERRQ(ierr);
872d8588912SDave May     /* hand back control to the nest vector */
873d8588912SDave May     for (j=0; j<bA->nc; j++) {
8746bf464f9SBarry Smith       ierr = VecDestroy(&R[j]);CHKERRQ(ierr);
875d8588912SDave May     }
876d8588912SDave May     ierr = PetscFree(R);CHKERRQ(ierr);
877d8588912SDave May   }
878d8588912SDave May 
879d8588912SDave May   if (left) {
880d8588912SDave May     /* allocate L */
881854ce69bSBarry Smith     ierr = PetscMalloc1(bA->nr, &L);CHKERRQ(ierr);
882d8588912SDave May     /* Create the left vectors */
883d8588912SDave May     for (i=0; i<bA->nr; i++) {
884d8588912SDave May       for (j=0; j<bA->nc; j++) {
885d8588912SDave May         if (bA->m[i][j]) {
8862a7a6963SBarry Smith           ierr = MatCreateVecs(bA->m[i][j],NULL,&L[i]);CHKERRQ(ierr);
887d8588912SDave May           break;
888d8588912SDave May         }
889d8588912SDave May       }
8906c4ed002SBarry Smith       if (j==bA->nc) SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null row.");
891d8588912SDave May     }
892d8588912SDave May 
893f349c1fdSJed Brown     ierr = VecCreateNest(comm,bA->nr,bA->isglobal.row,L,left);CHKERRQ(ierr);
894d8588912SDave May     for (i=0; i<bA->nr; i++) {
8956bf464f9SBarry Smith       ierr = VecDestroy(&L[i]);CHKERRQ(ierr);
896d8588912SDave May     }
897d8588912SDave May 
898d8588912SDave May     ierr = PetscFree(L);CHKERRQ(ierr);
899d8588912SDave May   }
900d8588912SDave May   PetscFunctionReturn(0);
901d8588912SDave May }
902d8588912SDave May 
903207556f9SJed Brown static PetscErrorCode MatView_Nest(Mat A,PetscViewer viewer)
904d8588912SDave May {
905d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
90629e60adbSStefano Zampini   PetscBool      isascii,viewSub = PETSC_FALSE;
907d8588912SDave May   PetscInt       i,j;
908d8588912SDave May   PetscErrorCode ierr;
909d8588912SDave May 
910d8588912SDave May   PetscFunctionBegin;
911251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
912d8588912SDave May   if (isascii) {
913d8588912SDave May 
91429e60adbSStefano Zampini     ierr = PetscOptionsGetBool(((PetscObject)A)->options,((PetscObject)A)->prefix,"-mat_view_nest_sub",&viewSub,NULL);CHKERRQ(ierr);
915d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"Matrix object: \n");CHKERRQ(ierr);
916d86155a6SBarry Smith     ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);
917d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer, "type=nest, rows=%D, cols=%D \n",bA->nr,bA->nc);CHKERRQ(ierr);
918d8588912SDave May 
919d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"MatNest structure: \n");CHKERRQ(ierr);
920d8588912SDave May     for (i=0; i<bA->nr; i++) {
921d8588912SDave May       for (j=0; j<bA->nc; j++) {
92219fd82e9SBarry Smith         MatType   type;
923270f95d7SJed Brown         char      name[256] = "",prefix[256] = "";
924d8588912SDave May         PetscInt  NR,NC;
925d8588912SDave May         PetscBool isNest = PETSC_FALSE;
926d8588912SDave May 
927d8588912SDave May         if (!bA->m[i][j]) {
928d86155a6SBarry Smith           CHKERRQ(ierr);PetscViewerASCIIPrintf(viewer, "(%D,%D) : NULL \n",i,j);CHKERRQ(ierr);
929d8588912SDave May           continue;
930d8588912SDave May         }
931d8588912SDave May         ierr = MatGetSize(bA->m[i][j],&NR,&NC);CHKERRQ(ierr);
932d8588912SDave May         ierr = MatGetType(bA->m[i][j], &type);CHKERRQ(ierr);
9338caf3d72SBarry Smith         if (((PetscObject)bA->m[i][j])->name) {ierr = PetscSNPrintf(name,sizeof(name),"name=\"%s\", ",((PetscObject)bA->m[i][j])->name);CHKERRQ(ierr);}
9348caf3d72SBarry Smith         if (((PetscObject)bA->m[i][j])->prefix) {ierr = PetscSNPrintf(prefix,sizeof(prefix),"prefix=\"%s\", ",((PetscObject)bA->m[i][j])->prefix);CHKERRQ(ierr);}
935251f4c67SDmitry Karpeev         ierr = PetscObjectTypeCompare((PetscObject)bA->m[i][j],MATNEST,&isNest);CHKERRQ(ierr);
936d8588912SDave May 
937270f95d7SJed Brown         ierr = PetscViewerASCIIPrintf(viewer,"(%D,%D) : %s%stype=%s, rows=%D, cols=%D \n",i,j,name,prefix,type,NR,NC);CHKERRQ(ierr);
938d8588912SDave May 
93929e60adbSStefano Zampini         if (isNest || viewSub) {
940270f95d7SJed Brown           ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);  /* push1 */
941d8588912SDave May           ierr = MatView(bA->m[i][j],viewer);CHKERRQ(ierr);
942270f95d7SJed Brown           ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);    /* pop1 */
943d8588912SDave May         }
944d8588912SDave May       }
945d8588912SDave May     }
946d86155a6SBarry Smith     ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);    /* pop0 */
947d8588912SDave May   }
948d8588912SDave May   PetscFunctionReturn(0);
949d8588912SDave May }
950d8588912SDave May 
951207556f9SJed Brown static PetscErrorCode MatZeroEntries_Nest(Mat A)
952d8588912SDave May {
953d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
954d8588912SDave May   PetscInt       i,j;
955d8588912SDave May   PetscErrorCode ierr;
956d8588912SDave May 
957d8588912SDave May   PetscFunctionBegin;
958d8588912SDave May   for (i=0; i<bA->nr; i++) {
959d8588912SDave May     for (j=0; j<bA->nc; j++) {
960d8588912SDave May       if (!bA->m[i][j]) continue;
961d8588912SDave May       ierr = MatZeroEntries(bA->m[i][j]);CHKERRQ(ierr);
962d8588912SDave May     }
963d8588912SDave May   }
964d8588912SDave May   PetscFunctionReturn(0);
965d8588912SDave May }
966d8588912SDave May 
967c222c20dSDavid Ham static PetscErrorCode MatCopy_Nest(Mat A,Mat B,MatStructure str)
968c222c20dSDavid Ham {
969c222c20dSDavid Ham   Mat_Nest       *bA = (Mat_Nest*)A->data,*bB = (Mat_Nest*)B->data;
970c222c20dSDavid Ham   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
971c222c20dSDavid Ham   PetscErrorCode ierr;
97206a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
973c222c20dSDavid Ham 
974c222c20dSDavid Ham   PetscFunctionBegin;
975c222c20dSDavid Ham   if (nr != bB->nr || nc != bB->nc) SETERRQ4(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Cannot copy a Mat_Nest of block size (%D,%D) to a Mat_Nest of block size (%D,%D)",bB->nr,bB->nc,nr,nc);
976c222c20dSDavid Ham   for (i=0; i<nr; i++) {
977c222c20dSDavid Ham     for (j=0; j<nc; j++) {
97806a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
97946a2b97cSJed Brown       if (bA->m[i][j] && bB->m[i][j]) {
980c222c20dSDavid Ham         ierr = MatCopy(bA->m[i][j],bB->m[i][j],str);CHKERRQ(ierr);
98146a2b97cSJed Brown       } else if (bA->m[i][j] || bB->m[i][j]) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %D,%D",i,j);
98206a1af2fSStefano Zampini       ierr = MatGetNonzeroState(bB->m[i][j],&subnnzstate);CHKERRQ(ierr);
98306a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || bB->nnzstate[i*nc+j] != subnnzstate);
98406a1af2fSStefano Zampini       bB->nnzstate[i*nc+j] = subnnzstate;
985c222c20dSDavid Ham     }
986c222c20dSDavid Ham   }
98706a1af2fSStefano Zampini   if (nnzstate) B->nonzerostate++;
988c222c20dSDavid Ham   PetscFunctionReturn(0);
989c222c20dSDavid Ham }
990c222c20dSDavid Ham 
9916e76ffeaSPierre Jolivet static PetscErrorCode MatAXPY_Nest(Mat Y,PetscScalar a,Mat X,MatStructure str)
9926e76ffeaSPierre Jolivet {
9936e76ffeaSPierre Jolivet   Mat_Nest       *bY = (Mat_Nest*)Y->data,*bX = (Mat_Nest*)X->data;
9946e76ffeaSPierre Jolivet   PetscInt       i,j,nr = bY->nr,nc = bY->nc;
9956e76ffeaSPierre Jolivet   PetscErrorCode ierr;
99606a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
9976e76ffeaSPierre Jolivet 
9986e76ffeaSPierre Jolivet   PetscFunctionBegin;
9996e76ffeaSPierre Jolivet   if (nr != bX->nr || nc != bX->nc) SETERRQ4(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Cannot AXPY a MatNest of block size (%D,%D) with a MatNest of block size (%D,%D)",bX->nr,bX->nc,nr,nc);
10006e76ffeaSPierre Jolivet   for (i=0; i<nr; i++) {
10016e76ffeaSPierre Jolivet     for (j=0; j<nc; j++) {
100206a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
10036e76ffeaSPierre Jolivet       if (bY->m[i][j] && bX->m[i][j]) {
10046e76ffeaSPierre Jolivet         ierr = MatAXPY(bY->m[i][j],a,bX->m[i][j],str);CHKERRQ(ierr);
1005c066aebcSStefano Zampini       } else if (bX->m[i][j]) {
1006c066aebcSStefano Zampini         Mat M;
1007c066aebcSStefano Zampini 
1008060bfc19SStefano Zampini         if (str != DIFFERENT_NONZERO_PATTERN) SETERRQ2(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %D,%D. Use DIFFERENT_NONZERO_PATTERN",i,j);
1009c066aebcSStefano Zampini         ierr = MatDuplicate(bX->m[i][j],MAT_COPY_VALUES,&M);CHKERRQ(ierr);
1010c066aebcSStefano Zampini         ierr = MatNestSetSubMat(Y,i,j,M);CHKERRQ(ierr);
1011c066aebcSStefano Zampini         ierr = MatDestroy(&M);CHKERRQ(ierr);
1012c066aebcSStefano Zampini       }
1013060bfc19SStefano Zampini       if (bY->m[i][j]) { ierr = MatGetNonzeroState(bY->m[i][j],&subnnzstate);CHKERRQ(ierr); }
101406a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || bY->nnzstate[i*nc+j] != subnnzstate);
101506a1af2fSStefano Zampini       bY->nnzstate[i*nc+j] = subnnzstate;
10166e76ffeaSPierre Jolivet     }
10176e76ffeaSPierre Jolivet   }
101806a1af2fSStefano Zampini   if (nnzstate) Y->nonzerostate++;
10196e76ffeaSPierre Jolivet   PetscFunctionReturn(0);
10206e76ffeaSPierre Jolivet }
10216e76ffeaSPierre Jolivet 
1022207556f9SJed Brown static PetscErrorCode MatDuplicate_Nest(Mat A,MatDuplicateOption op,Mat *B)
1023d8588912SDave May {
1024d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
1025841e96a3SJed Brown   Mat            *b;
1026841e96a3SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
1027d8588912SDave May   PetscErrorCode ierr;
1028d8588912SDave May 
1029d8588912SDave May   PetscFunctionBegin;
1030785e854fSJed Brown   ierr = PetscMalloc1(nr*nc,&b);CHKERRQ(ierr);
1031841e96a3SJed Brown   for (i=0; i<nr; i++) {
1032841e96a3SJed Brown     for (j=0; j<nc; j++) {
1033841e96a3SJed Brown       if (bA->m[i][j]) {
1034841e96a3SJed Brown         ierr = MatDuplicate(bA->m[i][j],op,&b[i*nc+j]);CHKERRQ(ierr);
1035841e96a3SJed Brown       } else {
10360298fd71SBarry Smith         b[i*nc+j] = NULL;
1037d8588912SDave May       }
1038d8588912SDave May     }
1039d8588912SDave May   }
1040ce94432eSBarry Smith   ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nr,bA->isglobal.row,nc,bA->isglobal.col,b,B);CHKERRQ(ierr);
1041841e96a3SJed Brown   /* Give the new MatNest exclusive ownership */
1042841e96a3SJed Brown   for (i=0; i<nr*nc; i++) {
10436bf464f9SBarry Smith     ierr = MatDestroy(&b[i]);CHKERRQ(ierr);
1044d8588912SDave May   }
1045d8588912SDave May   ierr = PetscFree(b);CHKERRQ(ierr);
1046d8588912SDave May 
1047841e96a3SJed Brown   ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1048841e96a3SJed Brown   ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1049d8588912SDave May   PetscFunctionReturn(0);
1050d8588912SDave May }
1051d8588912SDave May 
1052d8588912SDave May /* nest api */
1053d8588912SDave May PetscErrorCode MatNestGetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat *mat)
1054d8588912SDave May {
1055d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
10565fd66863SKarl Rupp 
1057d8588912SDave May   PetscFunctionBegin;
1058ce94432eSBarry Smith   if (idxm >= bA->nr) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",idxm,bA->nr-1);
1059ce94432eSBarry Smith   if (jdxm >= bA->nc) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %D max %D",jdxm,bA->nc-1);
1060d8588912SDave May   *mat = bA->m[idxm][jdxm];
1061d8588912SDave May   PetscFunctionReturn(0);
1062d8588912SDave May }
1063d8588912SDave May 
10649ba0d327SJed Brown /*@
1065d8588912SDave May  MatNestGetSubMat - Returns a single, sub-matrix from a nest matrix.
1066d8588912SDave May 
1067d8588912SDave May  Not collective
1068d8588912SDave May 
1069d8588912SDave May  Input Parameters:
1070629881c0SJed Brown +   A  - nest matrix
1071d8588912SDave May .   idxm - index of the matrix within the nest matrix
1072629881c0SJed Brown -   jdxm - index of the matrix within the nest matrix
1073d8588912SDave May 
1074d8588912SDave May  Output Parameter:
1075d8588912SDave May .   sub - matrix at index idxm,jdxm within the nest matrix
1076d8588912SDave May 
1077d8588912SDave May  Level: developer
1078d8588912SDave May 
1079bb97c47cSPierre Jolivet .seealso: MatNestGetSize(), MatNestGetSubMats(), MatCreateNest(), MATNEST, MatNestSetSubMat(),
108079798668SBarry Smith           MatNestGetLocalISs(), MatNestGetISs()
1081d8588912SDave May @*/
10827087cfbeSBarry Smith PetscErrorCode  MatNestGetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat *sub)
1083d8588912SDave May {
1084699a902aSJed Brown   PetscErrorCode ierr;
1085d8588912SDave May 
1086d8588912SDave May   PetscFunctionBegin;
1087699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSubMat_C",(Mat,PetscInt,PetscInt,Mat*),(A,idxm,jdxm,sub));CHKERRQ(ierr);
1088d8588912SDave May   PetscFunctionReturn(0);
1089d8588912SDave May }
1090d8588912SDave May 
10910782ca92SJed Brown PetscErrorCode MatNestSetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat mat)
10920782ca92SJed Brown {
10930782ca92SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
10940782ca92SJed Brown   PetscInt       m,n,M,N,mi,ni,Mi,Ni;
10950782ca92SJed Brown   PetscErrorCode ierr;
10960782ca92SJed Brown 
10970782ca92SJed Brown   PetscFunctionBegin;
1098ce94432eSBarry Smith   if (idxm >= bA->nr) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",idxm,bA->nr-1);
1099ce94432eSBarry Smith   if (jdxm >= bA->nc) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %D max %D",jdxm,bA->nc-1);
11000782ca92SJed Brown   ierr = MatGetLocalSize(mat,&m,&n);CHKERRQ(ierr);
11010782ca92SJed Brown   ierr = MatGetSize(mat,&M,&N);CHKERRQ(ierr);
11020782ca92SJed Brown   ierr = ISGetLocalSize(bA->isglobal.row[idxm],&mi);CHKERRQ(ierr);
11030782ca92SJed Brown   ierr = ISGetSize(bA->isglobal.row[idxm],&Mi);CHKERRQ(ierr);
11040782ca92SJed Brown   ierr = ISGetLocalSize(bA->isglobal.col[jdxm],&ni);CHKERRQ(ierr);
11050782ca92SJed Brown   ierr = ISGetSize(bA->isglobal.col[jdxm],&Ni);CHKERRQ(ierr);
1106ce94432eSBarry Smith   if (M != Mi || N != Ni) SETERRQ4(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix dimension (%D,%D) incompatible with nest block (%D,%D)",M,N,Mi,Ni);
1107ce94432eSBarry Smith   if (m != mi || n != ni) SETERRQ4(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix local dimension (%D,%D) incompatible with nest block (%D,%D)",m,n,mi,ni);
110826fbe8dcSKarl Rupp 
110906a1af2fSStefano Zampini   /* do not increase object state */
111006a1af2fSStefano Zampini   if (mat == bA->m[idxm][jdxm]) PetscFunctionReturn(0);
111106a1af2fSStefano Zampini 
11120782ca92SJed Brown   ierr = PetscObjectReference((PetscObject)mat);CHKERRQ(ierr);
11130782ca92SJed Brown   ierr = MatDestroy(&bA->m[idxm][jdxm]);CHKERRQ(ierr);
11140782ca92SJed Brown   bA->m[idxm][jdxm] = mat;
111506a1af2fSStefano Zampini   ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr);
111606a1af2fSStefano Zampini   ierr = MatGetNonzeroState(mat,&bA->nnzstate[idxm*bA->nc+jdxm]);CHKERRQ(ierr);
111706a1af2fSStefano Zampini   A->nonzerostate++;
11180782ca92SJed Brown   PetscFunctionReturn(0);
11190782ca92SJed Brown }
11200782ca92SJed Brown 
11219ba0d327SJed Brown /*@
11220782ca92SJed Brown  MatNestSetSubMat - Set a single submatrix in the nest matrix.
11230782ca92SJed Brown 
11240782ca92SJed Brown  Logically collective on the submatrix communicator
11250782ca92SJed Brown 
11260782ca92SJed Brown  Input Parameters:
11270782ca92SJed Brown +   A  - nest matrix
11280782ca92SJed Brown .   idxm - index of the matrix within the nest matrix
11290782ca92SJed Brown .   jdxm - index of the matrix within the nest matrix
11300782ca92SJed Brown -   sub - matrix at index idxm,jdxm within the nest matrix
11310782ca92SJed Brown 
11320782ca92SJed Brown  Notes:
11330782ca92SJed Brown  The new submatrix must have the same size and communicator as that block of the nest.
11340782ca92SJed Brown 
11350782ca92SJed Brown  This increments the reference count of the submatrix.
11360782ca92SJed Brown 
11370782ca92SJed Brown  Level: developer
11380782ca92SJed Brown 
1139bb97c47cSPierre Jolivet .seealso: MatNestSetSubMats(), MatNestGetSubMats(), MatNestGetLocalISs(), MATNEST, MatCreateNest(),
114079798668SBarry Smith           MatNestGetSubMat(), MatNestGetISs(), MatNestGetSize()
11410782ca92SJed Brown @*/
11420782ca92SJed Brown PetscErrorCode  MatNestSetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat sub)
11430782ca92SJed Brown {
11440782ca92SJed Brown   PetscErrorCode ierr;
11450782ca92SJed Brown 
11460782ca92SJed Brown   PetscFunctionBegin;
11470782ca92SJed Brown   ierr = PetscUseMethod(A,"MatNestSetSubMat_C",(Mat,PetscInt,PetscInt,Mat),(A,idxm,jdxm,sub));CHKERRQ(ierr);
11480782ca92SJed Brown   PetscFunctionReturn(0);
11490782ca92SJed Brown }
11500782ca92SJed Brown 
1151d8588912SDave May PetscErrorCode MatNestGetSubMats_Nest(Mat A,PetscInt *M,PetscInt *N,Mat ***mat)
1152d8588912SDave May {
1153d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
11545fd66863SKarl Rupp 
1155d8588912SDave May   PetscFunctionBegin;
115626fbe8dcSKarl Rupp   if (M)   *M   = bA->nr;
115726fbe8dcSKarl Rupp   if (N)   *N   = bA->nc;
115826fbe8dcSKarl Rupp   if (mat) *mat = bA->m;
1159d8588912SDave May   PetscFunctionReturn(0);
1160d8588912SDave May }
1161d8588912SDave May 
1162d8588912SDave May /*@C
1163d8588912SDave May  MatNestGetSubMats - Returns the entire two dimensional array of matrices defining a nest matrix.
1164d8588912SDave May 
1165d8588912SDave May  Not collective
1166d8588912SDave May 
1167d8588912SDave May  Input Parameters:
1168629881c0SJed Brown .   A  - nest matrix
1169d8588912SDave May 
1170d8588912SDave May  Output Parameter:
1171629881c0SJed Brown +   M - number of rows in the nest matrix
1172d8588912SDave May .   N - number of cols in the nest matrix
1173629881c0SJed Brown -   mat - 2d array of matrices
1174d8588912SDave May 
1175d8588912SDave May  Notes:
1176d8588912SDave May 
1177d8588912SDave May  The user should not free the array mat.
1178d8588912SDave May 
1179351962e3SVincent Le Chenadec  In Fortran, this routine has a calling sequence
1180351962e3SVincent Le Chenadec $   call MatNestGetSubMats(A, M, N, mat, ierr)
1181351962e3SVincent Le Chenadec  where the space allocated for the optional argument mat is assumed large enough (if provided).
1182351962e3SVincent Le Chenadec 
1183d8588912SDave May  Level: developer
1184d8588912SDave May 
1185bb97c47cSPierre Jolivet .seealso: MatNestGetSize(), MatNestGetSubMat(), MatNestGetLocalISs(), MATNEST, MatCreateNest(),
118679798668SBarry Smith           MatNestSetSubMats(), MatNestGetISs(), MatNestSetSubMat()
1187d8588912SDave May @*/
11887087cfbeSBarry Smith PetscErrorCode  MatNestGetSubMats(Mat A,PetscInt *M,PetscInt *N,Mat ***mat)
1189d8588912SDave May {
1190699a902aSJed Brown   PetscErrorCode ierr;
1191d8588912SDave May 
1192d8588912SDave May   PetscFunctionBegin;
1193699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSubMats_C",(Mat,PetscInt*,PetscInt*,Mat***),(A,M,N,mat));CHKERRQ(ierr);
1194d8588912SDave May   PetscFunctionReturn(0);
1195d8588912SDave May }
1196d8588912SDave May 
11977087cfbeSBarry Smith PetscErrorCode  MatNestGetSize_Nest(Mat A,PetscInt *M,PetscInt *N)
1198d8588912SDave May {
1199d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
1200d8588912SDave May 
1201d8588912SDave May   PetscFunctionBegin;
120226fbe8dcSKarl Rupp   if (M) *M = bA->nr;
120326fbe8dcSKarl Rupp   if (N) *N = bA->nc;
1204d8588912SDave May   PetscFunctionReturn(0);
1205d8588912SDave May }
1206d8588912SDave May 
12079ba0d327SJed Brown /*@
1208d8588912SDave May  MatNestGetSize - Returns the size of the nest matrix.
1209d8588912SDave May 
1210d8588912SDave May  Not collective
1211d8588912SDave May 
1212d8588912SDave May  Input Parameters:
1213d8588912SDave May .   A  - nest matrix
1214d8588912SDave May 
1215d8588912SDave May  Output Parameter:
1216629881c0SJed Brown +   M - number of rows in the nested mat
1217629881c0SJed Brown -   N - number of cols in the nested mat
1218d8588912SDave May 
1219d8588912SDave May  Notes:
1220d8588912SDave May 
1221d8588912SDave May  Level: developer
1222d8588912SDave May 
1223bb97c47cSPierre Jolivet .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MATNEST, MatCreateNest(), MatNestGetLocalISs(),
122479798668SBarry Smith           MatNestGetISs()
1225d8588912SDave May @*/
12267087cfbeSBarry Smith PetscErrorCode  MatNestGetSize(Mat A,PetscInt *M,PetscInt *N)
1227d8588912SDave May {
1228699a902aSJed Brown   PetscErrorCode ierr;
1229d8588912SDave May 
1230d8588912SDave May   PetscFunctionBegin;
1231699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSize_C",(Mat,PetscInt*,PetscInt*),(A,M,N));CHKERRQ(ierr);
1232d8588912SDave May   PetscFunctionReturn(0);
1233d8588912SDave May }
1234d8588912SDave May 
1235f7a08781SBarry Smith static PetscErrorCode MatNestGetISs_Nest(Mat A,IS rows[],IS cols[])
1236900e7ff2SJed Brown {
1237900e7ff2SJed Brown   Mat_Nest *vs = (Mat_Nest*)A->data;
1238900e7ff2SJed Brown   PetscInt i;
1239900e7ff2SJed Brown 
1240900e7ff2SJed Brown   PetscFunctionBegin;
1241900e7ff2SJed Brown   if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->isglobal.row[i];
1242900e7ff2SJed Brown   if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->isglobal.col[i];
1243900e7ff2SJed Brown   PetscFunctionReturn(0);
1244900e7ff2SJed Brown }
1245900e7ff2SJed Brown 
12463a4d7b9aSSatish Balay /*@C
1247900e7ff2SJed Brown  MatNestGetISs - Returns the index sets partitioning the row and column spaces
1248900e7ff2SJed Brown 
1249900e7ff2SJed Brown  Not collective
1250900e7ff2SJed Brown 
1251900e7ff2SJed Brown  Input Parameters:
1252900e7ff2SJed Brown .   A  - nest matrix
1253900e7ff2SJed Brown 
1254900e7ff2SJed Brown  Output Parameter:
1255900e7ff2SJed Brown +   rows - array of row index sets
1256900e7ff2SJed Brown -   cols - array of column index sets
1257900e7ff2SJed Brown 
1258900e7ff2SJed Brown  Level: advanced
1259900e7ff2SJed Brown 
1260900e7ff2SJed Brown  Notes:
1261900e7ff2SJed Brown  The user must have allocated arrays of the correct size. The reference count is not increased on the returned ISs.
1262900e7ff2SJed Brown 
126379798668SBarry Smith .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetLocalISs(), MATNEST,
1264bb97c47cSPierre Jolivet           MatCreateNest(), MatNestGetSubMats(), MatNestSetSubMats()
1265900e7ff2SJed Brown @*/
1266900e7ff2SJed Brown PetscErrorCode  MatNestGetISs(Mat A,IS rows[],IS cols[])
1267900e7ff2SJed Brown {
1268900e7ff2SJed Brown   PetscErrorCode ierr;
1269900e7ff2SJed Brown 
1270900e7ff2SJed Brown   PetscFunctionBegin;
1271900e7ff2SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1272900e7ff2SJed Brown   ierr = PetscUseMethod(A,"MatNestGetISs_C",(Mat,IS[],IS[]),(A,rows,cols));CHKERRQ(ierr);
1273900e7ff2SJed Brown   PetscFunctionReturn(0);
1274900e7ff2SJed Brown }
1275900e7ff2SJed Brown 
1276f7a08781SBarry Smith static PetscErrorCode MatNestGetLocalISs_Nest(Mat A,IS rows[],IS cols[])
1277900e7ff2SJed Brown {
1278900e7ff2SJed Brown   Mat_Nest *vs = (Mat_Nest*)A->data;
1279900e7ff2SJed Brown   PetscInt i;
1280900e7ff2SJed Brown 
1281900e7ff2SJed Brown   PetscFunctionBegin;
1282900e7ff2SJed Brown   if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->islocal.row[i];
1283900e7ff2SJed Brown   if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->islocal.col[i];
1284900e7ff2SJed Brown   PetscFunctionReturn(0);
1285900e7ff2SJed Brown }
1286900e7ff2SJed Brown 
1287900e7ff2SJed Brown /*@C
1288900e7ff2SJed Brown  MatNestGetLocalISs - Returns the index sets partitioning the row and column spaces
1289900e7ff2SJed Brown 
1290900e7ff2SJed Brown  Not collective
1291900e7ff2SJed Brown 
1292900e7ff2SJed Brown  Input Parameters:
1293900e7ff2SJed Brown .   A  - nest matrix
1294900e7ff2SJed Brown 
1295900e7ff2SJed Brown  Output Parameter:
12960298fd71SBarry Smith +   rows - array of row index sets (or NULL to ignore)
12970298fd71SBarry Smith -   cols - array of column index sets (or NULL to ignore)
1298900e7ff2SJed Brown 
1299900e7ff2SJed Brown  Level: advanced
1300900e7ff2SJed Brown 
1301900e7ff2SJed Brown  Notes:
1302900e7ff2SJed Brown  The user must have allocated arrays of the correct size. The reference count is not increased on the returned ISs.
1303900e7ff2SJed Brown 
1304bb97c47cSPierre Jolivet .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetISs(), MatCreateNest(),
130579798668SBarry Smith           MATNEST, MatNestSetSubMats(), MatNestSetSubMat()
1306900e7ff2SJed Brown @*/
1307900e7ff2SJed Brown PetscErrorCode  MatNestGetLocalISs(Mat A,IS rows[],IS cols[])
1308900e7ff2SJed Brown {
1309900e7ff2SJed Brown   PetscErrorCode ierr;
1310900e7ff2SJed Brown 
1311900e7ff2SJed Brown   PetscFunctionBegin;
1312900e7ff2SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1313900e7ff2SJed Brown   ierr = PetscUseMethod(A,"MatNestGetLocalISs_C",(Mat,IS[],IS[]),(A,rows,cols));CHKERRQ(ierr);
1314900e7ff2SJed Brown   PetscFunctionReturn(0);
1315900e7ff2SJed Brown }
1316900e7ff2SJed Brown 
131719fd82e9SBarry Smith PetscErrorCode  MatNestSetVecType_Nest(Mat A,VecType vtype)
1318207556f9SJed Brown {
1319207556f9SJed Brown   PetscErrorCode ierr;
1320207556f9SJed Brown   PetscBool      flg;
1321207556f9SJed Brown 
1322207556f9SJed Brown   PetscFunctionBegin;
1323207556f9SJed Brown   ierr = PetscStrcmp(vtype,VECNEST,&flg);CHKERRQ(ierr);
1324207556f9SJed Brown   /* In reality, this only distinguishes VECNEST and "other" */
13252a7a6963SBarry Smith   if (flg) A->ops->getvecs = MatCreateVecs_Nest;
132612b53f24SSatish Balay   else A->ops->getvecs = (PetscErrorCode (*)(Mat,Vec*,Vec*)) 0;
1327207556f9SJed Brown   PetscFunctionReturn(0);
1328207556f9SJed Brown }
1329207556f9SJed Brown 
1330207556f9SJed Brown /*@C
13312a7a6963SBarry Smith  MatNestSetVecType - Sets the type of Vec returned by MatCreateVecs()
1332207556f9SJed Brown 
1333207556f9SJed Brown  Not collective
1334207556f9SJed Brown 
1335207556f9SJed Brown  Input Parameters:
1336207556f9SJed Brown +  A  - nest matrix
1337207556f9SJed Brown -  vtype - type to use for creating vectors
1338207556f9SJed Brown 
1339207556f9SJed Brown  Notes:
1340207556f9SJed Brown 
1341207556f9SJed Brown  Level: developer
1342207556f9SJed Brown 
1343bb97c47cSPierre Jolivet .seealso: MatCreateVecs(), MATNEST, MatCreateNest()
1344207556f9SJed Brown @*/
134519fd82e9SBarry Smith PetscErrorCode  MatNestSetVecType(Mat A,VecType vtype)
1346207556f9SJed Brown {
1347207556f9SJed Brown   PetscErrorCode ierr;
1348207556f9SJed Brown 
1349207556f9SJed Brown   PetscFunctionBegin;
135019fd82e9SBarry Smith   ierr = PetscTryMethod(A,"MatNestSetVecType_C",(Mat,VecType),(A,vtype));CHKERRQ(ierr);
1351207556f9SJed Brown   PetscFunctionReturn(0);
1352207556f9SJed Brown }
1353207556f9SJed Brown 
1354c8883902SJed Brown PetscErrorCode MatNestSetSubMats_Nest(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[])
1355d8588912SDave May {
1356c8883902SJed Brown   Mat_Nest       *s = (Mat_Nest*)A->data;
1357c8883902SJed Brown   PetscInt       i,j,m,n,M,N;
1358d8588912SDave May   PetscErrorCode ierr;
135906a1af2fSStefano Zampini   PetscBool      cong;
1360d8588912SDave May 
1361d8588912SDave May   PetscFunctionBegin;
136206a1af2fSStefano Zampini   ierr = MatReset_Nest(A);CHKERRQ(ierr);
136306a1af2fSStefano Zampini 
1364c8883902SJed Brown   s->nr = nr;
1365c8883902SJed Brown   s->nc = nc;
1366d8588912SDave May 
1367c8883902SJed Brown   /* Create space for submatrices */
1368854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&s->m);CHKERRQ(ierr);
1369c8883902SJed Brown   for (i=0; i<nr; i++) {
1370854ce69bSBarry Smith     ierr = PetscMalloc1(nc,&s->m[i]);CHKERRQ(ierr);
1371d8588912SDave May   }
1372c8883902SJed Brown   for (i=0; i<nr; i++) {
1373c8883902SJed Brown     for (j=0; j<nc; j++) {
1374c8883902SJed Brown       s->m[i][j] = a[i*nc+j];
1375c8883902SJed Brown       if (a[i*nc+j]) {
1376c8883902SJed Brown         ierr = PetscObjectReference((PetscObject)a[i*nc+j]);CHKERRQ(ierr);
1377d8588912SDave May       }
1378d8588912SDave May     }
1379d8588912SDave May   }
1380d8588912SDave May 
13818188e55aSJed Brown   ierr = MatSetUp_NestIS_Private(A,nr,is_row,nc,is_col);CHKERRQ(ierr);
1382d8588912SDave May 
1383854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&s->row_len);CHKERRQ(ierr);
1384854ce69bSBarry Smith   ierr = PetscMalloc1(nc,&s->col_len);CHKERRQ(ierr);
1385c8883902SJed Brown   for (i=0; i<nr; i++) s->row_len[i]=-1;
1386c8883902SJed Brown   for (j=0; j<nc; j++) s->col_len[j]=-1;
1387d8588912SDave May 
138806a1af2fSStefano Zampini   ierr = PetscCalloc1(nr*nc,&s->nnzstate);CHKERRQ(ierr);
138906a1af2fSStefano Zampini   for (i=0; i<nr; i++) {
139006a1af2fSStefano Zampini     for (j=0; j<nc; j++) {
139106a1af2fSStefano Zampini       if (s->m[i][j]) {
139206a1af2fSStefano Zampini         ierr = MatGetNonzeroState(s->m[i][j],&s->nnzstate[i*nc+j]);CHKERRQ(ierr);
139306a1af2fSStefano Zampini       }
139406a1af2fSStefano Zampini     }
139506a1af2fSStefano Zampini   }
139606a1af2fSStefano Zampini 
13978188e55aSJed Brown   ierr = MatNestGetSizes_Private(A,&m,&n,&M,&N);CHKERRQ(ierr);
1398d8588912SDave May 
1399c8883902SJed Brown   ierr = PetscLayoutSetSize(A->rmap,M);CHKERRQ(ierr);
1400c8883902SJed Brown   ierr = PetscLayoutSetLocalSize(A->rmap,m);CHKERRQ(ierr);
1401c8883902SJed Brown   ierr = PetscLayoutSetSize(A->cmap,N);CHKERRQ(ierr);
1402c8883902SJed Brown   ierr = PetscLayoutSetLocalSize(A->cmap,n);CHKERRQ(ierr);
1403c8883902SJed Brown 
1404c8883902SJed Brown   ierr = PetscLayoutSetUp(A->rmap);CHKERRQ(ierr);
1405c8883902SJed Brown   ierr = PetscLayoutSetUp(A->cmap);CHKERRQ(ierr);
1406c8883902SJed Brown 
140706a1af2fSStefano Zampini   /* disable operations that are not supported for non-square matrices,
140806a1af2fSStefano Zampini      or matrices for which is_row != is_col  */
140906a1af2fSStefano Zampini   ierr = MatHasCongruentLayouts(A,&cong);CHKERRQ(ierr);
141006a1af2fSStefano Zampini   if (cong && nr != nc) cong = PETSC_FALSE;
141106a1af2fSStefano Zampini   if (cong) {
141206a1af2fSStefano Zampini     for (i = 0; cong && i < nr; i++) {
1413320466b0SStefano Zampini       ierr = ISEqualUnsorted(s->isglobal.row[i],s->isglobal.col[i],&cong);CHKERRQ(ierr);
141406a1af2fSStefano Zampini     }
141506a1af2fSStefano Zampini   }
141606a1af2fSStefano Zampini   if (!cong) {
1417381b8e50SStefano Zampini     A->ops->missingdiagonal = NULL;
141806a1af2fSStefano Zampini     A->ops->getdiagonal     = NULL;
141906a1af2fSStefano Zampini     A->ops->shift           = NULL;
142006a1af2fSStefano Zampini     A->ops->diagonalset     = NULL;
142106a1af2fSStefano Zampini   }
142206a1af2fSStefano Zampini 
14231795a4d1SJed Brown   ierr = PetscCalloc2(nr,&s->left,nc,&s->right);CHKERRQ(ierr);
142406a1af2fSStefano Zampini   ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr);
142506a1af2fSStefano Zampini   A->nonzerostate++;
1426d8588912SDave May   PetscFunctionReturn(0);
1427d8588912SDave May }
1428d8588912SDave May 
1429c8883902SJed Brown /*@
1430c8883902SJed Brown    MatNestSetSubMats - Sets the nested submatrices
1431c8883902SJed Brown 
1432c8883902SJed Brown    Collective on Mat
1433c8883902SJed Brown 
1434c8883902SJed Brown    Input Parameter:
1435ffd6319bSRichard Tran Mills +  A - nested matrix
1436c8883902SJed Brown .  nr - number of nested row blocks
14370298fd71SBarry Smith .  is_row - index sets for each nested row block, or NULL to make contiguous
1438c8883902SJed Brown .  nc - number of nested column blocks
14390298fd71SBarry Smith .  is_col - index sets for each nested column block, or NULL to make contiguous
14400298fd71SBarry Smith -  a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL
1441c8883902SJed Brown 
144206a1af2fSStefano Zampini    Notes: this always resets any submatrix information previously set
144306a1af2fSStefano Zampini 
1444c8883902SJed Brown    Level: advanced
1445c8883902SJed Brown 
144679798668SBarry Smith .seealso: MatCreateNest(), MATNEST, MatNestSetSubMat(), MatNestGetSubMat(), MatNestGetSubMats()
1447c8883902SJed Brown @*/
1448c8883902SJed Brown PetscErrorCode MatNestSetSubMats(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[])
1449c8883902SJed Brown {
1450c8883902SJed Brown   PetscErrorCode ierr;
145106a1af2fSStefano Zampini   PetscInt       i;
1452c8883902SJed Brown 
1453c8883902SJed Brown   PetscFunctionBegin;
1454c8883902SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1455ce94432eSBarry Smith   if (nr < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of rows cannot be negative");
1456c8883902SJed Brown   if (nr && is_row) {
1457c8883902SJed Brown     PetscValidPointer(is_row,3);
1458c8883902SJed Brown     for (i=0; i<nr; i++) PetscValidHeaderSpecific(is_row[i],IS_CLASSID,3);
1459c8883902SJed Brown   }
1460ce94432eSBarry Smith   if (nc < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of columns cannot be negative");
14611664e352SJed Brown   if (nc && is_col) {
1462c8883902SJed Brown     PetscValidPointer(is_col,5);
14639b30a8f6SBarry Smith     for (i=0; i<nc; i++) PetscValidHeaderSpecific(is_col[i],IS_CLASSID,5);
1464c8883902SJed Brown   }
146506a1af2fSStefano Zampini   if (nr*nc > 0) PetscValidPointer(a,6);
1466c8883902SJed Brown   ierr = PetscUseMethod(A,"MatNestSetSubMats_C",(Mat,PetscInt,const IS[],PetscInt,const IS[],const Mat[]),(A,nr,is_row,nc,is_col,a));CHKERRQ(ierr);
1467c8883902SJed Brown   PetscFunctionReturn(0);
1468c8883902SJed Brown }
1469d8588912SDave May 
147045b6f7e9SBarry Smith static PetscErrorCode MatNestCreateAggregateL2G_Private(Mat A,PetscInt n,const IS islocal[],const IS isglobal[],PetscBool colflg,ISLocalToGlobalMapping *ltog)
147177019fcaSJed Brown {
147277019fcaSJed Brown   PetscErrorCode ierr;
147377019fcaSJed Brown   PetscBool      flg;
147477019fcaSJed Brown   PetscInt       i,j,m,mi,*ix;
147577019fcaSJed Brown 
147677019fcaSJed Brown   PetscFunctionBegin;
1477aea6d515SStefano Zampini   *ltog = NULL;
147877019fcaSJed Brown   for (i=0,m=0,flg=PETSC_FALSE; i<n; i++) {
147977019fcaSJed Brown     if (islocal[i]) {
1480aea6d515SStefano Zampini       ierr = ISGetLocalSize(islocal[i],&mi);CHKERRQ(ierr);
148177019fcaSJed Brown       flg  = PETSC_TRUE;      /* We found a non-trivial entry */
148277019fcaSJed Brown     } else {
1483aea6d515SStefano Zampini       ierr = ISGetLocalSize(isglobal[i],&mi);CHKERRQ(ierr);
148477019fcaSJed Brown     }
148577019fcaSJed Brown     m += mi;
148677019fcaSJed Brown   }
1487aea6d515SStefano Zampini   if (!flg) PetscFunctionReturn(0);
1488aea6d515SStefano Zampini 
1489785e854fSJed Brown   ierr = PetscMalloc1(m,&ix);CHKERRQ(ierr);
1490165cd838SBarry Smith   for (i=0,m=0; i<n; i++) {
14910298fd71SBarry Smith     ISLocalToGlobalMapping smap = NULL;
1492e108cb99SStefano Zampini     Mat                    sub = NULL;
1493f6d38dbbSStefano Zampini     PetscSF                sf;
1494f6d38dbbSStefano Zampini     PetscLayout            map;
1495aea6d515SStefano Zampini     const PetscInt         *ix2;
149677019fcaSJed Brown 
1497165cd838SBarry Smith     if (!colflg) {
149877019fcaSJed Brown       ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
149977019fcaSJed Brown     } else {
150077019fcaSJed Brown       ierr = MatNestFindNonzeroSubMatCol(A,i,&sub);CHKERRQ(ierr);
150177019fcaSJed Brown     }
1502191fd14bSBarry Smith     if (sub) {
1503191fd14bSBarry Smith       if (!colflg) {
1504191fd14bSBarry Smith         ierr = MatGetLocalToGlobalMapping(sub,&smap,NULL);CHKERRQ(ierr);
1505191fd14bSBarry Smith       } else {
1506191fd14bSBarry Smith         ierr = MatGetLocalToGlobalMapping(sub,NULL,&smap);CHKERRQ(ierr);
1507191fd14bSBarry Smith       }
1508191fd14bSBarry Smith     }
150977019fcaSJed Brown     /*
151077019fcaSJed Brown        Now we need to extract the monolithic global indices that correspond to the given split global indices.
151177019fcaSJed Brown        In many/most cases, we only want MatGetLocalSubMatrix() to work, in which case we only need to know the size of the local spaces.
151277019fcaSJed Brown     */
1513aea6d515SStefano Zampini     ierr = ISGetIndices(isglobal[i],&ix2);CHKERRQ(ierr);
1514aea6d515SStefano Zampini     if (islocal[i]) {
1515aea6d515SStefano Zampini       PetscInt *ilocal,*iremote;
1516aea6d515SStefano Zampini       PetscInt mil,nleaves;
1517aea6d515SStefano Zampini 
1518aea6d515SStefano Zampini       ierr = ISGetLocalSize(islocal[i],&mi);CHKERRQ(ierr);
1519aea6d515SStefano Zampini       if (!smap) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"Missing local to global map");
1520aea6d515SStefano Zampini       for (j=0; j<mi; j++) ix[m+j] = j;
1521aea6d515SStefano Zampini       ierr = ISLocalToGlobalMappingApply(smap,mi,ix+m,ix+m);CHKERRQ(ierr);
1522aea6d515SStefano Zampini 
1523aea6d515SStefano Zampini       /* PetscSFSetGraphLayout does not like negative indices */
1524aea6d515SStefano Zampini       ierr = PetscMalloc2(mi,&ilocal,mi,&iremote);CHKERRQ(ierr);
1525aea6d515SStefano Zampini       for (j=0, nleaves = 0; j<mi; j++) {
1526aea6d515SStefano Zampini         if (ix[m+j] < 0) continue;
1527aea6d515SStefano Zampini         ilocal[nleaves]  = j;
1528aea6d515SStefano Zampini         iremote[nleaves] = ix[m+j];
1529aea6d515SStefano Zampini         nleaves++;
1530aea6d515SStefano Zampini       }
1531aea6d515SStefano Zampini       ierr = ISGetLocalSize(isglobal[i],&mil);CHKERRQ(ierr);
1532aea6d515SStefano Zampini       ierr = PetscSFCreate(PetscObjectComm((PetscObject)A),&sf);CHKERRQ(ierr);
1533aea6d515SStefano Zampini       ierr = PetscLayoutCreate(PetscObjectComm((PetscObject)A),&map);CHKERRQ(ierr);
1534aea6d515SStefano Zampini       ierr = PetscLayoutSetLocalSize(map,mil);CHKERRQ(ierr);
1535f6d38dbbSStefano Zampini       ierr = PetscLayoutSetUp(map);CHKERRQ(ierr);
1536aea6d515SStefano Zampini       ierr = PetscSFSetGraphLayout(sf,map,nleaves,ilocal,PETSC_USE_POINTER,iremote);CHKERRQ(ierr);
1537f6d38dbbSStefano Zampini       ierr = PetscLayoutDestroy(&map);CHKERRQ(ierr);
1538f6d38dbbSStefano Zampini       ierr = PetscSFBcastBegin(sf,MPIU_INT,ix2,ix + m);CHKERRQ(ierr);
1539f6d38dbbSStefano Zampini       ierr = PetscSFBcastEnd(sf,MPIU_INT,ix2,ix + m);CHKERRQ(ierr);
1540f6d38dbbSStefano Zampini       ierr = PetscSFDestroy(&sf);CHKERRQ(ierr);
1541aea6d515SStefano Zampini       ierr = PetscFree2(ilocal,iremote);CHKERRQ(ierr);
1542aea6d515SStefano Zampini     } else {
1543aea6d515SStefano Zampini       ierr = ISGetLocalSize(isglobal[i],&mi);CHKERRQ(ierr);
1544aea6d515SStefano Zampini       for (j=0; j<mi; j++) ix[m+j] = ix2[i];
1545aea6d515SStefano Zampini     }
1546aea6d515SStefano Zampini     ierr = ISRestoreIndices(isglobal[i],&ix2);CHKERRQ(ierr);
154777019fcaSJed Brown     m   += mi;
154877019fcaSJed Brown   }
1549f0413b6fSBarry Smith   ierr = ISLocalToGlobalMappingCreate(PetscObjectComm((PetscObject)A),1,m,ix,PETSC_OWN_POINTER,ltog);CHKERRQ(ierr);
155077019fcaSJed Brown   PetscFunctionReturn(0);
155177019fcaSJed Brown }
155277019fcaSJed Brown 
155377019fcaSJed Brown 
/* If an IS was provided, there is nothing Nest needs to do, otherwise Nest will build a strided IS */
/*
  nprocessors = NP
  Nest x^T = ((g_0,g_1,...,g_NP-1), (h_0,h_1,...,h_NP-1))
       proc 0:    => (g_0,h_0)
       proc 1:    => (g_1,h_1)
       ...
       proc NP-1: => (g_NP-1,h_NP-1)

            proc 0:                      proc 1:                    proc NP-1:
    is[0] = (0,1,2,...,nlocal(g_0)-1)  (0,1,...,nlocal(g_1)-1)  (0,1,...,nlocal(g_NP-1)-1)

            proc 0:
    is[1] = (nlocal(g_0),nlocal(g_0)+1,...,nlocal(g_0)+nlocal(h_0)-1)
            proc 1:
    is[1] = (nlocal(g_1),nlocal(g_1)+1,...,nlocal(g_1)+nlocal(h_1)-1)

            proc NP-1:
    is[1] = (nlocal(g_NP-1),nlocal(g_NP-1)+1,...,nlocal(g_NP-1)+nlocal(h_NP-1)-1)
*/
1574841e96a3SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[])
1575d8588912SDave May {
1576e2d7f03fSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
15778188e55aSJed Brown   PetscInt       i,j,offset,n,nsum,bs;
1578d8588912SDave May   PetscErrorCode ierr;
15790298fd71SBarry Smith   Mat            sub = NULL;
1580d8588912SDave May 
1581d8588912SDave May   PetscFunctionBegin;
1582854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&vs->isglobal.row);CHKERRQ(ierr);
1583854ce69bSBarry Smith   ierr = PetscMalloc1(nc,&vs->isglobal.col);CHKERRQ(ierr);
1584d8588912SDave May   if (is_row) { /* valid IS is passed in */
1585d8588912SDave May     /* refs on is[] are incremeneted */
1586e2d7f03fSJed Brown     for (i=0; i<vs->nr; i++) {
1587d8588912SDave May       ierr = PetscObjectReference((PetscObject)is_row[i]);CHKERRQ(ierr);
158826fbe8dcSKarl Rupp 
1589e2d7f03fSJed Brown       vs->isglobal.row[i] = is_row[i];
1590d8588912SDave May     }
15912ae74bdbSJed Brown   } else {                      /* Create the ISs by inspecting sizes of a submatrix in each row */
15928188e55aSJed Brown     nsum = 0;
15938188e55aSJed Brown     for (i=0; i<vs->nr; i++) {  /* Add up the local sizes to compute the aggregate offset */
15948188e55aSJed Brown       ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
1595ce94432eSBarry Smith       if (!sub) SETERRQ1(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in row %D",i);
15960298fd71SBarry Smith       ierr = MatGetLocalSize(sub,&n,NULL);CHKERRQ(ierr);
1597ce94432eSBarry Smith       if (n < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix");
15988188e55aSJed Brown       nsum += n;
15998188e55aSJed Brown     }
1600ce94432eSBarry Smith     ierr    = MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A));CHKERRQ(ierr);
160130bc264bSJed Brown     offset -= nsum;
1602e2d7f03fSJed Brown     for (i=0; i<vs->nr; i++) {
1603f349c1fdSJed Brown       ierr    = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
16040298fd71SBarry Smith       ierr    = MatGetLocalSize(sub,&n,NULL);CHKERRQ(ierr);
160573b6653fSLawrence Mitchell       ierr    = MatGetBlockSizes(sub,&bs,NULL);CHKERRQ(ierr);
1606ce94432eSBarry Smith       ierr    = ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.row[i]);CHKERRQ(ierr);
1607e2d7f03fSJed Brown       ierr    = ISSetBlockSize(vs->isglobal.row[i],bs);CHKERRQ(ierr);
16082ae74bdbSJed Brown       offset += n;
1609d8588912SDave May     }
1610d8588912SDave May   }
1611d8588912SDave May 
1612d8588912SDave May   if (is_col) { /* valid IS is passed in */
1613d8588912SDave May     /* refs on is[] are incremeneted */
1614e2d7f03fSJed Brown     for (j=0; j<vs->nc; j++) {
1615d8588912SDave May       ierr = PetscObjectReference((PetscObject)is_col[j]);CHKERRQ(ierr);
161626fbe8dcSKarl Rupp 
1617e2d7f03fSJed Brown       vs->isglobal.col[j] = is_col[j];
1618d8588912SDave May     }
16192ae74bdbSJed Brown   } else {                      /* Create the ISs by inspecting sizes of a submatrix in each column */
16202ae74bdbSJed Brown     offset = A->cmap->rstart;
16218188e55aSJed Brown     nsum   = 0;
16228188e55aSJed Brown     for (j=0; j<vs->nc; j++) {
16238188e55aSJed Brown       ierr = MatNestFindNonzeroSubMatCol(A,j,&sub);CHKERRQ(ierr);
1624ce94432eSBarry Smith       if (!sub) SETERRQ1(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in column %D",i);
16250298fd71SBarry Smith       ierr = MatGetLocalSize(sub,NULL,&n);CHKERRQ(ierr);
1626ce94432eSBarry Smith       if (n < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix");
16278188e55aSJed Brown       nsum += n;
16288188e55aSJed Brown     }
1629ce94432eSBarry Smith     ierr    = MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A));CHKERRQ(ierr);
163030bc264bSJed Brown     offset -= nsum;
1631e2d7f03fSJed Brown     for (j=0; j<vs->nc; j++) {
1632f349c1fdSJed Brown       ierr    = MatNestFindNonzeroSubMatCol(A,j,&sub);CHKERRQ(ierr);
16330298fd71SBarry Smith       ierr    = MatGetLocalSize(sub,NULL,&n);CHKERRQ(ierr);
163473b6653fSLawrence Mitchell       ierr    = MatGetBlockSizes(sub,NULL,&bs);CHKERRQ(ierr);
1635ce94432eSBarry Smith       ierr    = ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.col[j]);CHKERRQ(ierr);
1636e2d7f03fSJed Brown       ierr    = ISSetBlockSize(vs->isglobal.col[j],bs);CHKERRQ(ierr);
16372ae74bdbSJed Brown       offset += n;
1638d8588912SDave May     }
1639d8588912SDave May   }
1640e2d7f03fSJed Brown 
1641e2d7f03fSJed Brown   /* Set up the local ISs */
1642785e854fSJed Brown   ierr = PetscMalloc1(vs->nr,&vs->islocal.row);CHKERRQ(ierr);
1643785e854fSJed Brown   ierr = PetscMalloc1(vs->nc,&vs->islocal.col);CHKERRQ(ierr);
1644e2d7f03fSJed Brown   for (i=0,offset=0; i<vs->nr; i++) {
1645e2d7f03fSJed Brown     IS                     isloc;
16460298fd71SBarry Smith     ISLocalToGlobalMapping rmap = NULL;
1647e2d7f03fSJed Brown     PetscInt               nlocal,bs;
1648e2d7f03fSJed Brown     ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
16490298fd71SBarry Smith     if (sub) {ierr = MatGetLocalToGlobalMapping(sub,&rmap,NULL);CHKERRQ(ierr);}
1650207556f9SJed Brown     if (rmap) {
165173b6653fSLawrence Mitchell       ierr = MatGetBlockSizes(sub,&bs,NULL);CHKERRQ(ierr);
1652e2d7f03fSJed Brown       ierr = ISLocalToGlobalMappingGetSize(rmap,&nlocal);CHKERRQ(ierr);
1653e2d7f03fSJed Brown       ierr = ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc);CHKERRQ(ierr);
1654e2d7f03fSJed Brown       ierr = ISSetBlockSize(isloc,bs);CHKERRQ(ierr);
1655207556f9SJed Brown     } else {
1656207556f9SJed Brown       nlocal = 0;
16570298fd71SBarry Smith       isloc  = NULL;
1658207556f9SJed Brown     }
1659e2d7f03fSJed Brown     vs->islocal.row[i] = isloc;
1660e2d7f03fSJed Brown     offset            += nlocal;
1661e2d7f03fSJed Brown   }
16628188e55aSJed Brown   for (i=0,offset=0; i<vs->nc; i++) {
1663e2d7f03fSJed Brown     IS                     isloc;
16640298fd71SBarry Smith     ISLocalToGlobalMapping cmap = NULL;
1665e2d7f03fSJed Brown     PetscInt               nlocal,bs;
1666e2d7f03fSJed Brown     ierr = MatNestFindNonzeroSubMatCol(A,i,&sub);CHKERRQ(ierr);
16670298fd71SBarry Smith     if (sub) {ierr = MatGetLocalToGlobalMapping(sub,NULL,&cmap);CHKERRQ(ierr);}
1668207556f9SJed Brown     if (cmap) {
166973b6653fSLawrence Mitchell       ierr = MatGetBlockSizes(sub,NULL,&bs);CHKERRQ(ierr);
1670e2d7f03fSJed Brown       ierr = ISLocalToGlobalMappingGetSize(cmap,&nlocal);CHKERRQ(ierr);
1671e2d7f03fSJed Brown       ierr = ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc);CHKERRQ(ierr);
1672e2d7f03fSJed Brown       ierr = ISSetBlockSize(isloc,bs);CHKERRQ(ierr);
1673207556f9SJed Brown     } else {
1674207556f9SJed Brown       nlocal = 0;
16750298fd71SBarry Smith       isloc  = NULL;
1676207556f9SJed Brown     }
1677e2d7f03fSJed Brown     vs->islocal.col[i] = isloc;
1678e2d7f03fSJed Brown     offset            += nlocal;
1679e2d7f03fSJed Brown   }
16800189643fSJed Brown 
168177019fcaSJed Brown   /* Set up the aggregate ISLocalToGlobalMapping */
168277019fcaSJed Brown   {
168345b6f7e9SBarry Smith     ISLocalToGlobalMapping rmap,cmap;
168445b6f7e9SBarry Smith     ierr = MatNestCreateAggregateL2G_Private(A,vs->nr,vs->islocal.row,vs->isglobal.row,PETSC_FALSE,&rmap);CHKERRQ(ierr);
168545b6f7e9SBarry Smith     ierr = MatNestCreateAggregateL2G_Private(A,vs->nc,vs->islocal.col,vs->isglobal.col,PETSC_TRUE,&cmap);CHKERRQ(ierr);
168677019fcaSJed Brown     if (rmap && cmap) {ierr = MatSetLocalToGlobalMapping(A,rmap,cmap);CHKERRQ(ierr);}
168777019fcaSJed Brown     ierr = ISLocalToGlobalMappingDestroy(&rmap);CHKERRQ(ierr);
168877019fcaSJed Brown     ierr = ISLocalToGlobalMappingDestroy(&cmap);CHKERRQ(ierr);
168977019fcaSJed Brown   }
169077019fcaSJed Brown 
169176bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
16920189643fSJed Brown     for (i=0; i<vs->nr; i++) {
16930189643fSJed Brown       for (j=0; j<vs->nc; j++) {
16940189643fSJed Brown         PetscInt m,n,M,N,mi,ni,Mi,Ni;
16950189643fSJed Brown         Mat      B = vs->m[i][j];
16960189643fSJed Brown         if (!B) continue;
16970189643fSJed Brown         ierr = MatGetSize(B,&M,&N);CHKERRQ(ierr);
16980189643fSJed Brown         ierr = MatGetLocalSize(B,&m,&n);CHKERRQ(ierr);
16990189643fSJed Brown         ierr = ISGetSize(vs->isglobal.row[i],&Mi);CHKERRQ(ierr);
17000189643fSJed Brown         ierr = ISGetSize(vs->isglobal.col[j],&Ni);CHKERRQ(ierr);
17010189643fSJed Brown         ierr = ISGetLocalSize(vs->isglobal.row[i],&mi);CHKERRQ(ierr);
17020189643fSJed Brown         ierr = ISGetLocalSize(vs->isglobal.col[j],&ni);CHKERRQ(ierr);
1703ce94432eSBarry Smith         if (M != Mi || N != Ni) SETERRQ6(PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Global sizes (%D,%D) of nested submatrix (%D,%D) do not agree with space defined by index sets (%D,%D)",M,N,i,j,Mi,Ni);
1704ce94432eSBarry Smith         if (m != mi || n != ni) SETERRQ6(PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Local sizes (%D,%D) of nested submatrix (%D,%D) do not agree with space defined by index sets (%D,%D)",m,n,i,j,mi,ni);
17050189643fSJed Brown       }
17060189643fSJed Brown     }
170776bd3646SJed Brown   }
1708a061e289SJed Brown 
1709a061e289SJed Brown   /* Set A->assembled if all non-null blocks are currently assembled */
1710a061e289SJed Brown   for (i=0; i<vs->nr; i++) {
1711a061e289SJed Brown     for (j=0; j<vs->nc; j++) {
1712a061e289SJed Brown       if (vs->m[i][j] && !vs->m[i][j]->assembled) PetscFunctionReturn(0);
1713a061e289SJed Brown     }
1714a061e289SJed Brown   }
1715a061e289SJed Brown   A->assembled = PETSC_TRUE;
1716d8588912SDave May   PetscFunctionReturn(0);
1717d8588912SDave May }
1718d8588912SDave May 
171945c38901SJed Brown /*@C
1720659c6bb0SJed Brown    MatCreateNest - Creates a new matrix containing several nested submatrices, each stored separately
1721659c6bb0SJed Brown 
1722659c6bb0SJed Brown    Collective on Mat
1723659c6bb0SJed Brown 
1724659c6bb0SJed Brown    Input Parameter:
1725659c6bb0SJed Brown +  comm - Communicator for the new Mat
1726659c6bb0SJed Brown .  nr - number of nested row blocks
17270298fd71SBarry Smith .  is_row - index sets for each nested row block, or NULL to make contiguous
1728659c6bb0SJed Brown .  nc - number of nested column blocks
17290298fd71SBarry Smith .  is_col - index sets for each nested column block, or NULL to make contiguous
17300298fd71SBarry Smith -  a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL
1731659c6bb0SJed Brown 
1732659c6bb0SJed Brown    Output Parameter:
1733659c6bb0SJed Brown .  B - new matrix
1734659c6bb0SJed Brown 
1735659c6bb0SJed Brown    Level: advanced
1736659c6bb0SJed Brown 
173779798668SBarry Smith .seealso: MatCreate(), VecCreateNest(), DMCreateMatrix(), MATNEST, MatNestSetSubMat(),
173879798668SBarry Smith           MatNestGetSubMat(), MatNestGetLocalISs(), MatNestGetSize(),
173979798668SBarry Smith           MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats()
1740659c6bb0SJed Brown @*/
17417087cfbeSBarry Smith PetscErrorCode MatCreateNest(MPI_Comm comm,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[],Mat *B)
1742d8588912SDave May {
1743d8588912SDave May   Mat            A;
1744d8588912SDave May   PetscErrorCode ierr;
1745d8588912SDave May 
1746d8588912SDave May   PetscFunctionBegin;
1747*f4259b30SLisandro Dalcin   *B   = NULL;
1748d8588912SDave May   ierr = MatCreate(comm,&A);CHKERRQ(ierr);
1749c8883902SJed Brown   ierr = MatSetType(A,MATNEST);CHKERRQ(ierr);
175091a28eb3SBarry Smith   A->preallocated = PETSC_TRUE;
1751c8883902SJed Brown   ierr = MatNestSetSubMats(A,nr,is_row,nc,is_col,a);CHKERRQ(ierr);
1752d8588912SDave May   *B   = A;
1753d8588912SDave May   PetscFunctionReturn(0);
1754d8588912SDave May }
1755659c6bb0SJed Brown 
1756b68353e5Sstefano_zampini static PetscErrorCode MatConvert_Nest_SeqAIJ_fast(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
1757b68353e5Sstefano_zampini {
1758b68353e5Sstefano_zampini   Mat_Nest       *nest = (Mat_Nest*)A->data;
175923875855Sstefano_zampini   Mat            *trans;
1760b68353e5Sstefano_zampini   PetscScalar    **avv;
1761b68353e5Sstefano_zampini   PetscScalar    *vv;
1762b68353e5Sstefano_zampini   PetscInt       **aii,**ajj;
1763b68353e5Sstefano_zampini   PetscInt       *ii,*jj,*ci;
1764b68353e5Sstefano_zampini   PetscInt       nr,nc,nnz,i,j;
1765b68353e5Sstefano_zampini   PetscBool      done;
1766b68353e5Sstefano_zampini   PetscErrorCode ierr;
1767b68353e5Sstefano_zampini 
1768b68353e5Sstefano_zampini   PetscFunctionBegin;
1769b68353e5Sstefano_zampini   ierr = MatGetSize(A,&nr,&nc);CHKERRQ(ierr);
1770b68353e5Sstefano_zampini   if (reuse == MAT_REUSE_MATRIX) {
1771b68353e5Sstefano_zampini     PetscInt rnr;
1772b68353e5Sstefano_zampini 
1773b68353e5Sstefano_zampini     ierr = MatGetRowIJ(*newmat,0,PETSC_FALSE,PETSC_FALSE,&rnr,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr);
1774b68353e5Sstefano_zampini     if (!done) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"MatGetRowIJ");
1775b68353e5Sstefano_zampini     if (rnr != nr) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of rows");
1776b68353e5Sstefano_zampini     ierr = MatSeqAIJGetArray(*newmat,&vv);CHKERRQ(ierr);
1777b68353e5Sstefano_zampini   }
1778b68353e5Sstefano_zampini   /* extract CSR for nested SeqAIJ matrices */
1779b68353e5Sstefano_zampini   nnz  = 0;
178023875855Sstefano_zampini   ierr = PetscCalloc4(nest->nr*nest->nc,&aii,nest->nr*nest->nc,&ajj,nest->nr*nest->nc,&avv,nest->nr*nest->nc,&trans);CHKERRQ(ierr);
1781b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1782b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1783b68353e5Sstefano_zampini       Mat B = nest->m[i][j];
1784b68353e5Sstefano_zampini       if (B) {
1785b68353e5Sstefano_zampini         PetscScalar *naa;
1786b68353e5Sstefano_zampini         PetscInt    *nii,*njj,nnr;
178723875855Sstefano_zampini         PetscBool   istrans;
1788b68353e5Sstefano_zampini 
178923875855Sstefano_zampini         ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans);CHKERRQ(ierr);
179023875855Sstefano_zampini         if (istrans) {
179123875855Sstefano_zampini           Mat Bt;
179223875855Sstefano_zampini 
179323875855Sstefano_zampini           ierr = MatTransposeGetMat(B,&Bt);CHKERRQ(ierr);
179423875855Sstefano_zampini           ierr = MatTranspose(Bt,MAT_INITIAL_MATRIX,&trans[i*nest->nc+j]);CHKERRQ(ierr);
179523875855Sstefano_zampini           B    = trans[i*nest->nc+j];
179623875855Sstefano_zampini         }
1797b68353e5Sstefano_zampini         ierr = MatGetRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&nii,(const PetscInt**)&njj,&done);CHKERRQ(ierr);
1798b68353e5Sstefano_zampini         if (!done) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatGetRowIJ");
1799b68353e5Sstefano_zampini         ierr = MatSeqAIJGetArray(B,&naa);CHKERRQ(ierr);
1800b68353e5Sstefano_zampini         nnz += nii[nnr];
1801b68353e5Sstefano_zampini 
1802b68353e5Sstefano_zampini         aii[i*nest->nc+j] = nii;
1803b68353e5Sstefano_zampini         ajj[i*nest->nc+j] = njj;
1804b68353e5Sstefano_zampini         avv[i*nest->nc+j] = naa;
1805b68353e5Sstefano_zampini       }
1806b68353e5Sstefano_zampini     }
1807b68353e5Sstefano_zampini   }
1808b68353e5Sstefano_zampini   if (reuse != MAT_REUSE_MATRIX) {
1809b68353e5Sstefano_zampini     ierr = PetscMalloc1(nr+1,&ii);CHKERRQ(ierr);
1810b68353e5Sstefano_zampini     ierr = PetscMalloc1(nnz,&jj);CHKERRQ(ierr);
1811b68353e5Sstefano_zampini     ierr = PetscMalloc1(nnz,&vv);CHKERRQ(ierr);
1812b68353e5Sstefano_zampini   } else {
1813b68353e5Sstefano_zampini     if (nnz != ii[nr]) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of nonzeros");
1814b68353e5Sstefano_zampini   }
1815b68353e5Sstefano_zampini 
1816b68353e5Sstefano_zampini   /* new row pointer */
1817580bdb30SBarry Smith   ierr = PetscArrayzero(ii,nr+1);CHKERRQ(ierr);
1818b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1819b68353e5Sstefano_zampini     PetscInt       ncr,rst;
1820b68353e5Sstefano_zampini 
1821b68353e5Sstefano_zampini     ierr = ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL);CHKERRQ(ierr);
1822b68353e5Sstefano_zampini     ierr = ISGetLocalSize(nest->isglobal.row[i],&ncr);CHKERRQ(ierr);
1823b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1824b68353e5Sstefano_zampini       if (aii[i*nest->nc+j]) {
1825b68353e5Sstefano_zampini         PetscInt    *nii = aii[i*nest->nc+j];
1826b68353e5Sstefano_zampini         PetscInt    ir;
1827b68353e5Sstefano_zampini 
1828b68353e5Sstefano_zampini         for (ir=rst; ir<ncr+rst; ++ir) {
1829b68353e5Sstefano_zampini           ii[ir+1] += nii[1]-nii[0];
1830b68353e5Sstefano_zampini           nii++;
1831b68353e5Sstefano_zampini         }
1832b68353e5Sstefano_zampini       }
1833b68353e5Sstefano_zampini     }
1834b68353e5Sstefano_zampini   }
1835b68353e5Sstefano_zampini   for (i=0; i<nr; i++) ii[i+1] += ii[i];
1836b68353e5Sstefano_zampini 
1837b68353e5Sstefano_zampini   /* construct CSR for the new matrix */
1838b68353e5Sstefano_zampini   ierr = PetscCalloc1(nr,&ci);CHKERRQ(ierr);
1839b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1840b68353e5Sstefano_zampini     PetscInt       ncr,rst;
1841b68353e5Sstefano_zampini 
1842b68353e5Sstefano_zampini     ierr = ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL);CHKERRQ(ierr);
1843b68353e5Sstefano_zampini     ierr = ISGetLocalSize(nest->isglobal.row[i],&ncr);CHKERRQ(ierr);
1844b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1845b68353e5Sstefano_zampini       if (aii[i*nest->nc+j]) {
1846b68353e5Sstefano_zampini         PetscScalar *nvv = avv[i*nest->nc+j];
1847b68353e5Sstefano_zampini         PetscInt    *nii = aii[i*nest->nc+j];
1848b68353e5Sstefano_zampini         PetscInt    *njj = ajj[i*nest->nc+j];
1849b68353e5Sstefano_zampini         PetscInt    ir,cst;
1850b68353e5Sstefano_zampini 
1851b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.col[j],&cst,NULL);CHKERRQ(ierr);
1852b68353e5Sstefano_zampini         for (ir=rst; ir<ncr+rst; ++ir) {
1853b68353e5Sstefano_zampini           PetscInt ij,rsize = nii[1]-nii[0],ist = ii[ir]+ci[ir];
1854b68353e5Sstefano_zampini 
1855b68353e5Sstefano_zampini           for (ij=0;ij<rsize;ij++) {
1856b68353e5Sstefano_zampini             jj[ist+ij] = *njj+cst;
1857b68353e5Sstefano_zampini             vv[ist+ij] = *nvv;
1858b68353e5Sstefano_zampini             njj++;
1859b68353e5Sstefano_zampini             nvv++;
1860b68353e5Sstefano_zampini           }
1861b68353e5Sstefano_zampini           ci[ir] += rsize;
1862b68353e5Sstefano_zampini           nii++;
1863b68353e5Sstefano_zampini         }
1864b68353e5Sstefano_zampini       }
1865b68353e5Sstefano_zampini     }
1866b68353e5Sstefano_zampini   }
1867b68353e5Sstefano_zampini   ierr = PetscFree(ci);CHKERRQ(ierr);
1868b68353e5Sstefano_zampini 
1869b68353e5Sstefano_zampini   /* restore info */
1870b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1871b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1872b68353e5Sstefano_zampini       Mat B = nest->m[i][j];
1873b68353e5Sstefano_zampini       if (B) {
1874b68353e5Sstefano_zampini         PetscInt nnr = 0, k = i*nest->nc+j;
187523875855Sstefano_zampini 
187623875855Sstefano_zampini         B    = (trans[k] ? trans[k] : B);
1877b68353e5Sstefano_zampini         ierr = MatRestoreRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&aii[k],(const PetscInt**)&ajj[k],&done);CHKERRQ(ierr);
1878b68353e5Sstefano_zampini         if (!done) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatRestoreRowIJ");
1879b68353e5Sstefano_zampini         ierr = MatSeqAIJRestoreArray(B,&avv[k]);CHKERRQ(ierr);
188023875855Sstefano_zampini         ierr = MatDestroy(&trans[k]);CHKERRQ(ierr);
1881b68353e5Sstefano_zampini       }
1882b68353e5Sstefano_zampini     }
1883b68353e5Sstefano_zampini   }
188423875855Sstefano_zampini   ierr = PetscFree4(aii,ajj,avv,trans);CHKERRQ(ierr);
1885b68353e5Sstefano_zampini 
1886b68353e5Sstefano_zampini   /* finalize newmat */
1887b68353e5Sstefano_zampini   if (reuse == MAT_INITIAL_MATRIX) {
1888b68353e5Sstefano_zampini     ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,newmat);CHKERRQ(ierr);
1889b68353e5Sstefano_zampini   } else if (reuse == MAT_INPLACE_MATRIX) {
1890b68353e5Sstefano_zampini     Mat B;
1891b68353e5Sstefano_zampini 
1892b68353e5Sstefano_zampini     ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,&B);CHKERRQ(ierr);
1893b68353e5Sstefano_zampini     ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr);
1894b68353e5Sstefano_zampini   }
1895b68353e5Sstefano_zampini   ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1896b68353e5Sstefano_zampini   ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1897b68353e5Sstefano_zampini   {
1898b68353e5Sstefano_zampini     Mat_SeqAIJ *a = (Mat_SeqAIJ*)((*newmat)->data);
1899b68353e5Sstefano_zampini     a->free_a     = PETSC_TRUE;
1900b68353e5Sstefano_zampini     a->free_ij    = PETSC_TRUE;
1901b68353e5Sstefano_zampini   }
1902b68353e5Sstefano_zampini   PetscFunctionReturn(0);
1903b68353e5Sstefano_zampini }
1904b68353e5Sstefano_zampini 
1905cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_Nest_AIJ(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
1906629c3df2SDmitry Karpeev {
1907629c3df2SDmitry Karpeev   PetscErrorCode ierr;
1908629c3df2SDmitry Karpeev   Mat_Nest       *nest = (Mat_Nest*)A->data;
190983b1a929SMark Adams   PetscInt       m,n,M,N,i,j,k,*dnnz,*onnz,rstart;
1910649b366bSFande Kong   PetscInt       cstart,cend;
1911b68353e5Sstefano_zampini   PetscMPIInt    size;
1912629c3df2SDmitry Karpeev   Mat            C;
1913629c3df2SDmitry Karpeev 
1914629c3df2SDmitry Karpeev   PetscFunctionBegin;
1915b68353e5Sstefano_zampini   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&size);CHKERRQ(ierr);
1916b68353e5Sstefano_zampini   if (size == 1) { /* look for a special case with SeqAIJ matrices and strided-1, contiguous, blocks */
1917b68353e5Sstefano_zampini     PetscInt  nf;
1918b68353e5Sstefano_zampini     PetscBool fast;
1919b68353e5Sstefano_zampini 
1920b68353e5Sstefano_zampini     ierr = PetscStrcmp(newtype,MATAIJ,&fast);CHKERRQ(ierr);
1921b68353e5Sstefano_zampini     if (!fast) {
1922b68353e5Sstefano_zampini       ierr = PetscStrcmp(newtype,MATSEQAIJ,&fast);CHKERRQ(ierr);
1923b68353e5Sstefano_zampini     }
1924b68353e5Sstefano_zampini     for (i=0; i<nest->nr && fast; ++i) {
1925b68353e5Sstefano_zampini       for (j=0; j<nest->nc && fast; ++j) {
1926b68353e5Sstefano_zampini         Mat B = nest->m[i][j];
1927b68353e5Sstefano_zampini         if (B) {
1928b68353e5Sstefano_zampini           ierr = PetscObjectTypeCompare((PetscObject)B,MATSEQAIJ,&fast);CHKERRQ(ierr);
192923875855Sstefano_zampini           if (!fast) {
193023875855Sstefano_zampini             PetscBool istrans;
193123875855Sstefano_zampini 
193223875855Sstefano_zampini             ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans);CHKERRQ(ierr);
193323875855Sstefano_zampini             if (istrans) {
193423875855Sstefano_zampini               Mat Bt;
193523875855Sstefano_zampini 
193623875855Sstefano_zampini               ierr = MatTransposeGetMat(B,&Bt);CHKERRQ(ierr);
193723875855Sstefano_zampini               ierr = PetscObjectTypeCompare((PetscObject)Bt,MATSEQAIJ,&fast);CHKERRQ(ierr);
193823875855Sstefano_zampini             }
1939b68353e5Sstefano_zampini           }
1940b68353e5Sstefano_zampini         }
1941b68353e5Sstefano_zampini       }
1942b68353e5Sstefano_zampini     }
1943b68353e5Sstefano_zampini     for (i=0, nf=0; i<nest->nr && fast; ++i) {
1944b68353e5Sstefano_zampini       ierr = PetscObjectTypeCompare((PetscObject)nest->isglobal.row[i],ISSTRIDE,&fast);CHKERRQ(ierr);
1945b68353e5Sstefano_zampini       if (fast) {
1946b68353e5Sstefano_zampini         PetscInt f,s;
1947b68353e5Sstefano_zampini 
1948b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.row[i],&f,&s);CHKERRQ(ierr);
1949b68353e5Sstefano_zampini         if (f != nf || s != 1) { fast = PETSC_FALSE; }
1950b68353e5Sstefano_zampini         else {
1951b68353e5Sstefano_zampini           ierr = ISGetSize(nest->isglobal.row[i],&f);CHKERRQ(ierr);
1952b68353e5Sstefano_zampini           nf  += f;
1953b68353e5Sstefano_zampini         }
1954b68353e5Sstefano_zampini       }
1955b68353e5Sstefano_zampini     }
1956b68353e5Sstefano_zampini     for (i=0, nf=0; i<nest->nc && fast; ++i) {
1957b68353e5Sstefano_zampini       ierr = PetscObjectTypeCompare((PetscObject)nest->isglobal.col[i],ISSTRIDE,&fast);CHKERRQ(ierr);
1958b68353e5Sstefano_zampini       if (fast) {
1959b68353e5Sstefano_zampini         PetscInt f,s;
1960b68353e5Sstefano_zampini 
1961b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.col[i],&f,&s);CHKERRQ(ierr);
1962b68353e5Sstefano_zampini         if (f != nf || s != 1) { fast = PETSC_FALSE; }
1963b68353e5Sstefano_zampini         else {
1964b68353e5Sstefano_zampini           ierr = ISGetSize(nest->isglobal.col[i],&f);CHKERRQ(ierr);
1965b68353e5Sstefano_zampini           nf  += f;
1966b68353e5Sstefano_zampini         }
1967b68353e5Sstefano_zampini       }
1968b68353e5Sstefano_zampini     }
1969b68353e5Sstefano_zampini     if (fast) {
1970b68353e5Sstefano_zampini       ierr = MatConvert_Nest_SeqAIJ_fast(A,newtype,reuse,newmat);CHKERRQ(ierr);
1971b68353e5Sstefano_zampini       PetscFunctionReturn(0);
1972b68353e5Sstefano_zampini     }
1973b68353e5Sstefano_zampini   }
1974629c3df2SDmitry Karpeev   ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr);
1975629c3df2SDmitry Karpeev   ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr);
1976649b366bSFande Kong   ierr = MatGetOwnershipRangeColumn(A,&cstart,&cend);CHKERRQ(ierr);
1977629c3df2SDmitry Karpeev   switch (reuse) {
1978629c3df2SDmitry Karpeev   case MAT_INITIAL_MATRIX:
1979ce94432eSBarry Smith     ierr    = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr);
1980629c3df2SDmitry Karpeev     ierr    = MatSetType(C,newtype);CHKERRQ(ierr);
1981629c3df2SDmitry Karpeev     ierr    = MatSetSizes(C,m,n,M,N);CHKERRQ(ierr);
1982629c3df2SDmitry Karpeev     *newmat = C;
1983629c3df2SDmitry Karpeev     break;
1984629c3df2SDmitry Karpeev   case MAT_REUSE_MATRIX:
1985629c3df2SDmitry Karpeev     C = *newmat;
1986629c3df2SDmitry Karpeev     break;
1987ce94432eSBarry Smith   default: SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MatReuse");
1988629c3df2SDmitry Karpeev   }
1989785e854fSJed Brown   ierr = PetscMalloc1(2*m,&dnnz);CHKERRQ(ierr);
1990629c3df2SDmitry Karpeev   onnz = dnnz + m;
1991629c3df2SDmitry Karpeev   for (k=0; k<m; k++) {
1992629c3df2SDmitry Karpeev     dnnz[k] = 0;
1993629c3df2SDmitry Karpeev     onnz[k] = 0;
1994629c3df2SDmitry Karpeev   }
1995629c3df2SDmitry Karpeev   for (j=0; j<nest->nc; ++j) {
1996629c3df2SDmitry Karpeev     IS             bNis;
1997629c3df2SDmitry Karpeev     PetscInt       bN;
1998629c3df2SDmitry Karpeev     const PetscInt *bNindices;
1999629c3df2SDmitry Karpeev     /* Using global column indices and ISAllGather() is not scalable. */
2000629c3df2SDmitry Karpeev     ierr = ISAllGather(nest->isglobal.col[j], &bNis);CHKERRQ(ierr);
2001629c3df2SDmitry Karpeev     ierr = ISGetSize(bNis, &bN);CHKERRQ(ierr);
2002629c3df2SDmitry Karpeev     ierr = ISGetIndices(bNis,&bNindices);CHKERRQ(ierr);
2003629c3df2SDmitry Karpeev     for (i=0; i<nest->nr; ++i) {
2004629c3df2SDmitry Karpeev       PetscSF        bmsf;
2005649b366bSFande Kong       PetscSFNode    *iremote;
2006629c3df2SDmitry Karpeev       Mat            B;
2007649b366bSFande Kong       PetscInt       bm, *sub_dnnz,*sub_onnz, br;
2008629c3df2SDmitry Karpeev       const PetscInt *bmindices;
2009629c3df2SDmitry Karpeev       B = nest->m[i][j];
2010629c3df2SDmitry Karpeev       if (!B) continue;
2011629c3df2SDmitry Karpeev       ierr = ISGetLocalSize(nest->isglobal.row[i],&bm);CHKERRQ(ierr);
2012629c3df2SDmitry Karpeev       ierr = ISGetIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2013ce94432eSBarry Smith       ierr = PetscSFCreate(PetscObjectComm((PetscObject)A), &bmsf);CHKERRQ(ierr);
2014649b366bSFande Kong       ierr = PetscMalloc1(bm,&iremote);CHKERRQ(ierr);
2015649b366bSFande Kong       ierr = PetscMalloc1(bm,&sub_dnnz);CHKERRQ(ierr);
2016649b366bSFande Kong       ierr = PetscMalloc1(bm,&sub_onnz);CHKERRQ(ierr);
2017649b366bSFande Kong       for (k = 0; k < bm; ++k){
2018649b366bSFande Kong     	sub_dnnz[k] = 0;
2019649b366bSFande Kong     	sub_onnz[k] = 0;
2020649b366bSFande Kong       }
2021629c3df2SDmitry Karpeev       /*
2022629c3df2SDmitry Karpeev        Locate the owners for all of the locally-owned global row indices for this row block.
2023629c3df2SDmitry Karpeev        These determine the roots of PetscSF used to communicate preallocation data to row owners.
2024629c3df2SDmitry Karpeev        The roots correspond to the dnnz and onnz entries; thus, there are two roots per row.
2025629c3df2SDmitry Karpeev        */
202683b1a929SMark Adams       ierr = MatGetOwnershipRange(B,&rstart,NULL);CHKERRQ(ierr);
2027629c3df2SDmitry Karpeev       for (br = 0; br < bm; ++br) {
2028131c27b5Sprj-         PetscInt       row = bmindices[br], brncols, col;
2029629c3df2SDmitry Karpeev         const PetscInt *brcols;
2030a4b3d3acSMatthew G Knepley         PetscInt       rowrel = 0; /* row's relative index on its owner rank */
2031131c27b5Sprj-         PetscMPIInt    rowowner = 0;
2032629c3df2SDmitry Karpeev         ierr      = PetscLayoutFindOwnerIndex(A->rmap,row,&rowowner,&rowrel);CHKERRQ(ierr);
2033649b366bSFande Kong         /* how many roots  */
2034649b366bSFande Kong         iremote[br].rank = rowowner; iremote[br].index = rowrel;           /* edge from bmdnnz to dnnz */
2035649b366bSFande Kong         /* get nonzero pattern */
203683b1a929SMark Adams         ierr = MatGetRow(B,br+rstart,&brncols,&brcols,NULL);CHKERRQ(ierr);
2037629c3df2SDmitry Karpeev         for (k=0; k<brncols; k++) {
2038629c3df2SDmitry Karpeev           col  = bNindices[brcols[k]];
2039649b366bSFande Kong           if (col>=A->cmap->range[rowowner] && col<A->cmap->range[rowowner+1]) {
2040649b366bSFande Kong             sub_dnnz[br]++;
2041649b366bSFande Kong           } else {
2042649b366bSFande Kong             sub_onnz[br]++;
2043649b366bSFande Kong           }
2044629c3df2SDmitry Karpeev         }
204583b1a929SMark Adams         ierr = MatRestoreRow(B,br+rstart,&brncols,&brcols,NULL);CHKERRQ(ierr);
2046629c3df2SDmitry Karpeev       }
2047629c3df2SDmitry Karpeev       ierr = ISRestoreIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2048629c3df2SDmitry Karpeev       /* bsf will have to take care of disposing of bedges. */
2049649b366bSFande Kong       ierr = PetscSFSetGraph(bmsf,m,bm,NULL,PETSC_OWN_POINTER,iremote,PETSC_OWN_POINTER);CHKERRQ(ierr);
2050649b366bSFande Kong       ierr = PetscSFReduceBegin(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM);CHKERRQ(ierr);
2051649b366bSFande Kong       ierr = PetscSFReduceEnd(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM);CHKERRQ(ierr);
2052649b366bSFande Kong       ierr = PetscSFReduceBegin(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM);CHKERRQ(ierr);
2053649b366bSFande Kong       ierr = PetscSFReduceEnd(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM);CHKERRQ(ierr);
2054649b366bSFande Kong       ierr = PetscFree(sub_dnnz);CHKERRQ(ierr);
2055649b366bSFande Kong       ierr = PetscFree(sub_onnz);CHKERRQ(ierr);
2056629c3df2SDmitry Karpeev       ierr = PetscSFDestroy(&bmsf);CHKERRQ(ierr);
2057629c3df2SDmitry Karpeev     }
205822d28d08SBarry Smith     ierr = ISRestoreIndices(bNis,&bNindices);CHKERRQ(ierr);
2059629c3df2SDmitry Karpeev     ierr = ISDestroy(&bNis);CHKERRQ(ierr);
206065a4a0a3Sstefano_zampini   }
206165a4a0a3Sstefano_zampini   /* Resize preallocation if overestimated */
206265a4a0a3Sstefano_zampini   for (i=0;i<m;i++) {
206365a4a0a3Sstefano_zampini     dnnz[i] = PetscMin(dnnz[i],A->cmap->n);
206465a4a0a3Sstefano_zampini     onnz[i] = PetscMin(onnz[i],A->cmap->N - A->cmap->n);
2065629c3df2SDmitry Karpeev   }
2066629c3df2SDmitry Karpeev   ierr = MatSeqAIJSetPreallocation(C,0,dnnz);CHKERRQ(ierr);
2067629c3df2SDmitry Karpeev   ierr = MatMPIAIJSetPreallocation(C,0,dnnz,0,onnz);CHKERRQ(ierr);
2068629c3df2SDmitry Karpeev   ierr = PetscFree(dnnz);CHKERRQ(ierr);
2069629c3df2SDmitry Karpeev 
2070629c3df2SDmitry Karpeev   /* Fill by row */
2071629c3df2SDmitry Karpeev   for (j=0; j<nest->nc; ++j) {
2072629c3df2SDmitry Karpeev     /* Using global column indices and ISAllGather() is not scalable. */
2073629c3df2SDmitry Karpeev     IS             bNis;
2074629c3df2SDmitry Karpeev     PetscInt       bN;
2075629c3df2SDmitry Karpeev     const PetscInt *bNindices;
2076629c3df2SDmitry Karpeev     ierr = ISAllGather(nest->isglobal.col[j], &bNis);CHKERRQ(ierr);
2077629c3df2SDmitry Karpeev     ierr = ISGetSize(bNis,&bN);CHKERRQ(ierr);
2078629c3df2SDmitry Karpeev     ierr = ISGetIndices(bNis,&bNindices);CHKERRQ(ierr);
2079629c3df2SDmitry Karpeev     for (i=0; i<nest->nr; ++i) {
2080629c3df2SDmitry Karpeev       Mat            B;
2081629c3df2SDmitry Karpeev       PetscInt       bm, br;
2082629c3df2SDmitry Karpeev       const PetscInt *bmindices;
2083629c3df2SDmitry Karpeev       B = nest->m[i][j];
2084629c3df2SDmitry Karpeev       if (!B) continue;
2085629c3df2SDmitry Karpeev       ierr = ISGetLocalSize(nest->isglobal.row[i],&bm);CHKERRQ(ierr);
2086629c3df2SDmitry Karpeev       ierr = ISGetIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
208783b1a929SMark Adams       ierr = MatGetOwnershipRange(B,&rstart,NULL);CHKERRQ(ierr);
2088629c3df2SDmitry Karpeev       for (br = 0; br < bm; ++br) {
2089629c3df2SDmitry Karpeev         PetscInt          row = bmindices[br], brncols,  *cols;
2090629c3df2SDmitry Karpeev         const PetscInt    *brcols;
2091629c3df2SDmitry Karpeev         const PetscScalar *brcoldata;
209283b1a929SMark Adams         ierr = MatGetRow(B,br+rstart,&brncols,&brcols,&brcoldata);CHKERRQ(ierr);
2093785e854fSJed Brown         ierr = PetscMalloc1(brncols,&cols);CHKERRQ(ierr);
209426fbe8dcSKarl Rupp         for (k=0; k<brncols; k++) cols[k] = bNindices[brcols[k]];
2095629c3df2SDmitry Karpeev         /*
2096629c3df2SDmitry Karpeev           Nest blocks are required to be nonoverlapping -- otherwise nest and monolithic index layouts wouldn't match.
2097629c3df2SDmitry Karpeev           Thus, we could use INSERT_VALUES, but I prefer ADD_VALUES.
2098629c3df2SDmitry Karpeev          */
2099a2ea699eSBarry Smith         ierr = MatSetValues(C,1,&row,brncols,cols,brcoldata,ADD_VALUES);CHKERRQ(ierr);
210083b1a929SMark Adams         ierr = MatRestoreRow(B,br+rstart,&brncols,&brcols,&brcoldata);CHKERRQ(ierr);
2101629c3df2SDmitry Karpeev         ierr = PetscFree(cols);CHKERRQ(ierr);
2102629c3df2SDmitry Karpeev       }
2103629c3df2SDmitry Karpeev       ierr = ISRestoreIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2104629c3df2SDmitry Karpeev     }
2105a2ea699eSBarry Smith     ierr = ISRestoreIndices(bNis,&bNindices);CHKERRQ(ierr);
2106629c3df2SDmitry Karpeev     ierr = ISDestroy(&bNis);CHKERRQ(ierr);
2107629c3df2SDmitry Karpeev   }
2108629c3df2SDmitry Karpeev   ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2109629c3df2SDmitry Karpeev   ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2110629c3df2SDmitry Karpeev   PetscFunctionReturn(0);
2111629c3df2SDmitry Karpeev }
2112629c3df2SDmitry Karpeev 
21138b7d3b4bSBarry Smith PetscErrorCode MatHasOperation_Nest(Mat mat,MatOperation op,PetscBool *has)
21148b7d3b4bSBarry Smith {
21158b7d3b4bSBarry Smith   Mat_Nest       *bA = (Mat_Nest*)mat->data;
21163c6db4c4SPierre Jolivet   MatOperation   opAdd;
21178b7d3b4bSBarry Smith   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
21188b7d3b4bSBarry Smith   PetscBool      flg;
211952c5f739Sprj-   PetscErrorCode ierr;
212052c5f739Sprj-   PetscFunctionBegin;
21218b7d3b4bSBarry Smith 
212252c5f739Sprj-   *has = PETSC_FALSE;
21233c6db4c4SPierre Jolivet   if (op == MATOP_MULT || op == MATOP_MULT_ADD || op == MATOP_MULT_TRANSPOSE || op == MATOP_MULT_TRANSPOSE_ADD) {
21243c6db4c4SPierre Jolivet     opAdd = (op == MATOP_MULT || op == MATOP_MULT_ADD ? MATOP_MULT_ADD : MATOP_MULT_TRANSPOSE_ADD);
21258b7d3b4bSBarry Smith     for (j=0; j<nc; j++) {
21268b7d3b4bSBarry Smith       for (i=0; i<nr; i++) {
21278b7d3b4bSBarry Smith         if (!bA->m[i][j]) continue;
21283c6db4c4SPierre Jolivet         ierr = MatHasOperation(bA->m[i][j],opAdd,&flg);CHKERRQ(ierr);
21298b7d3b4bSBarry Smith         if (!flg) PetscFunctionReturn(0);
21308b7d3b4bSBarry Smith       }
21318b7d3b4bSBarry Smith     }
21328b7d3b4bSBarry Smith   }
21333c6db4c4SPierre Jolivet   if (((void**)mat->ops)[op]) *has = PETSC_TRUE;
21348b7d3b4bSBarry Smith   PetscFunctionReturn(0);
21358b7d3b4bSBarry Smith }
21368b7d3b4bSBarry Smith 
2137659c6bb0SJed Brown /*MC
2138659c6bb0SJed Brown   MATNEST - MATNEST = "nest" - Matrix type consisting of nested submatrices, each stored separately.
2139659c6bb0SJed Brown 
2140659c6bb0SJed Brown   Level: intermediate
2141659c6bb0SJed Brown 
2142659c6bb0SJed Brown   Notes:
2143659c6bb0SJed Brown   This matrix type permits scalable use of PCFieldSplit and avoids the large memory costs of extracting submatrices.
2144659c6bb0SJed Brown   It allows the use of symmetric and block formats for parts of multi-physics simulations.
  It is usually used with DMComposite and DMCreateMatrix().
2146659c6bb0SJed Brown 
  Each of the submatrices lives on the same MPI communicator as the original nest matrix (though they can have zero
  rows/columns on some processes). Thus, this matrix type is not meant for cases where the submatrices live on far
  fewer processes than the nest matrix.
21508b7d3b4bSBarry Smith 
215179798668SBarry Smith .seealso: MatCreate(), MatType, MatCreateNest(), MatNestSetSubMat(), MatNestGetSubMat(),
215279798668SBarry Smith           VecCreateNest(), DMCreateMatrix(), DMCOMPOSITE, MatNestSetVecType(), MatNestGetLocalISs(),
215379798668SBarry Smith           MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats()
2154659c6bb0SJed Brown M*/
21558cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_Nest(Mat A)
2156c8883902SJed Brown {
2157c8883902SJed Brown   Mat_Nest       *s;
2158c8883902SJed Brown   PetscErrorCode ierr;
2159c8883902SJed Brown 
2160c8883902SJed Brown   PetscFunctionBegin;
2161b00a9115SJed Brown   ierr    = PetscNewLog(A,&s);CHKERRQ(ierr);
2162c8883902SJed Brown   A->data = (void*)s;
2163e7c19651SJed Brown 
2164e7c19651SJed Brown   s->nr            = -1;
2165e7c19651SJed Brown   s->nc            = -1;
21660298fd71SBarry Smith   s->m             = NULL;
2167e7c19651SJed Brown   s->splitassembly = PETSC_FALSE;
2168c8883902SJed Brown 
2169c8883902SJed Brown   ierr = PetscMemzero(A->ops,sizeof(*A->ops));CHKERRQ(ierr);
217026fbe8dcSKarl Rupp 
2171c8883902SJed Brown   A->ops->mult                  = MatMult_Nest;
21729194d70fSJed Brown   A->ops->multadd               = MatMultAdd_Nest;
2173c8883902SJed Brown   A->ops->multtranspose         = MatMultTranspose_Nest;
21749194d70fSJed Brown   A->ops->multtransposeadd      = MatMultTransposeAdd_Nest;
2175f8170845SAlex Fikl   A->ops->transpose             = MatTranspose_Nest;
2176c8883902SJed Brown   A->ops->assemblybegin         = MatAssemblyBegin_Nest;
2177c8883902SJed Brown   A->ops->assemblyend           = MatAssemblyEnd_Nest;
2178c8883902SJed Brown   A->ops->zeroentries           = MatZeroEntries_Nest;
2179c222c20dSDavid Ham   A->ops->copy                  = MatCopy_Nest;
21806e76ffeaSPierre Jolivet   A->ops->axpy                  = MatAXPY_Nest;
2181c8883902SJed Brown   A->ops->duplicate             = MatDuplicate_Nest;
21827dae84e0SHong Zhang   A->ops->createsubmatrix       = MatCreateSubMatrix_Nest;
2183c8883902SJed Brown   A->ops->destroy               = MatDestroy_Nest;
2184c8883902SJed Brown   A->ops->view                  = MatView_Nest;
2185*f4259b30SLisandro Dalcin   A->ops->getvecs               = NULL; /* Use VECNEST by calling MatNestSetVecType(A,VECNEST) */
2186c8883902SJed Brown   A->ops->getlocalsubmatrix     = MatGetLocalSubMatrix_Nest;
2187c8883902SJed Brown   A->ops->restorelocalsubmatrix = MatRestoreLocalSubMatrix_Nest;
2188429bac76SJed Brown   A->ops->getdiagonal           = MatGetDiagonal_Nest;
2189429bac76SJed Brown   A->ops->diagonalscale         = MatDiagonalScale_Nest;
2190a061e289SJed Brown   A->ops->scale                 = MatScale_Nest;
2191a061e289SJed Brown   A->ops->shift                 = MatShift_Nest;
219213135bc6SAlex Fikl   A->ops->diagonalset           = MatDiagonalSet_Nest;
2193f8170845SAlex Fikl   A->ops->setrandom             = MatSetRandom_Nest;
21948b7d3b4bSBarry Smith   A->ops->hasoperation          = MatHasOperation_Nest;
2195381b8e50SStefano Zampini   A->ops->missingdiagonal       = MatMissingDiagonal_Nest;
2196c8883902SJed Brown 
2197*f4259b30SLisandro Dalcin   A->spptr        = NULL;
2198c8883902SJed Brown   A->assembled    = PETSC_FALSE;
2199c8883902SJed Brown 
2200c8883902SJed Brown   /* expose Nest api's */
2201bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",        MatNestGetSubMat_Nest);CHKERRQ(ierr);
2202bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",        MatNestSetSubMat_Nest);CHKERRQ(ierr);
2203bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",       MatNestGetSubMats_Nest);CHKERRQ(ierr);
2204bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",          MatNestGetSize_Nest);CHKERRQ(ierr);
2205bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",           MatNestGetISs_Nest);CHKERRQ(ierr);
2206bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",      MatNestGetLocalISs_Nest);CHKERRQ(ierr);
2207bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",       MatNestSetVecType_Nest);CHKERRQ(ierr);
2208bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",       MatNestSetSubMats_Nest);CHKERRQ(ierr);
22090899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",  MatConvert_Nest_AIJ);CHKERRQ(ierr);
22100899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",  MatConvert_Nest_AIJ);CHKERRQ(ierr);
221183b1a929SMark Adams   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",     MatConvert_Nest_AIJ);CHKERRQ(ierr);
22125e3038f0Sstefano_zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",      MatConvert_Nest_IS);CHKERRQ(ierr);
22134222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_seqdense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr);
22144222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_mpidense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr);
22154222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_dense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr);
2216c8883902SJed Brown 
2217c8883902SJed Brown   ierr = PetscObjectChangeTypeName((PetscObject)A,MATNEST);CHKERRQ(ierr);
2218c8883902SJed Brown   PetscFunctionReturn(0);
2219c8883902SJed Brown }
2220