xref: /petsc/src/mat/impls/nest/matnest.c (revision ad227fea26420e7a31ef041a9fa1418814d171a8)
1aaa7dc30SBarry Smith #include <../src/mat/impls/nest/matnestimpl.h> /*I   "petscmat.h"   I*/
2b68353e5Sstefano_zampini #include <../src/mat/impls/aij/seq/aij.h>
30c312b8eSJed Brown #include <petscsf.h>
4d8588912SDave May 
5c8883902SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat,PetscInt,const IS[],PetscInt,const IS[]);
606a1af2fSStefano Zampini static PetscErrorCode MatCreateVecs_Nest(Mat,Vec*,Vec*);
706a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat);
806a1af2fSStefano Zampini 
95e3038f0Sstefano_zampini PETSC_INTERN PetscErrorCode MatConvert_Nest_IS(Mat,MatType,MatReuse,Mat*);
10c8883902SJed Brown 
11d8588912SDave May /* private functions */
128188e55aSJed Brown static PetscErrorCode MatNestGetSizes_Private(Mat A,PetscInt *m,PetscInt *n,PetscInt *M,PetscInt *N)
13d8588912SDave May {
14d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
158188e55aSJed Brown   PetscInt       i,j;
16d8588912SDave May   PetscErrorCode ierr;
17d8588912SDave May 
18d8588912SDave May   PetscFunctionBegin;
198188e55aSJed Brown   *m = *n = *M = *N = 0;
208188e55aSJed Brown   for (i=0; i<bA->nr; i++) {  /* rows */
218188e55aSJed Brown     PetscInt sm,sM;
228188e55aSJed Brown     ierr = ISGetLocalSize(bA->isglobal.row[i],&sm);CHKERRQ(ierr);
238188e55aSJed Brown     ierr = ISGetSize(bA->isglobal.row[i],&sM);CHKERRQ(ierr);
248188e55aSJed Brown     *m  += sm;
258188e55aSJed Brown     *M  += sM;
26d8588912SDave May   }
278188e55aSJed Brown   for (j=0; j<bA->nc; j++) {  /* cols */
288188e55aSJed Brown     PetscInt sn,sN;
298188e55aSJed Brown     ierr = ISGetLocalSize(bA->isglobal.col[j],&sn);CHKERRQ(ierr);
308188e55aSJed Brown     ierr = ISGetSize(bA->isglobal.col[j],&sN);CHKERRQ(ierr);
318188e55aSJed Brown     *n  += sn;
328188e55aSJed Brown     *N  += sN;
33d8588912SDave May   }
34d8588912SDave May   PetscFunctionReturn(0);
35d8588912SDave May }
36d8588912SDave May 
37d8588912SDave May /* operations */
38207556f9SJed Brown static PetscErrorCode MatMult_Nest(Mat A,Vec x,Vec y)
39d8588912SDave May {
40d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
41207556f9SJed Brown   Vec            *bx = bA->right,*by = bA->left;
42207556f9SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
43d8588912SDave May   PetscErrorCode ierr;
44d8588912SDave May 
45d8588912SDave May   PetscFunctionBegin;
46207556f9SJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(y,bA->isglobal.row[i],&by[i]);CHKERRQ(ierr);}
47207556f9SJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
48207556f9SJed Brown   for (i=0; i<nr; i++) {
49d8588912SDave May     ierr = VecZeroEntries(by[i]);CHKERRQ(ierr);
50207556f9SJed Brown     for (j=0; j<nc; j++) {
51207556f9SJed Brown       if (!bA->m[i][j]) continue;
52d8588912SDave May       /* y[i] <- y[i] + A[i][j] * x[j] */
53d8588912SDave May       ierr = MatMultAdd(bA->m[i][j],bx[j],by[i],by[i]);CHKERRQ(ierr);
54d8588912SDave May     }
55d8588912SDave May   }
56207556f9SJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(y,bA->isglobal.row[i],&by[i]);CHKERRQ(ierr);}
57207556f9SJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
58d8588912SDave May   PetscFunctionReturn(0);
59d8588912SDave May }
60d8588912SDave May 
619194d70fSJed Brown static PetscErrorCode MatMultAdd_Nest(Mat A,Vec x,Vec y,Vec z)
629194d70fSJed Brown {
639194d70fSJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
649194d70fSJed Brown   Vec            *bx = bA->right,*bz = bA->left;
659194d70fSJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
669194d70fSJed Brown   PetscErrorCode ierr;
679194d70fSJed Brown 
689194d70fSJed Brown   PetscFunctionBegin;
699194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(z,bA->isglobal.row[i],&bz[i]);CHKERRQ(ierr);}
709194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
719194d70fSJed Brown   for (i=0; i<nr; i++) {
729194d70fSJed Brown     if (y != z) {
739194d70fSJed Brown       Vec by;
749194d70fSJed Brown       ierr = VecGetSubVector(y,bA->isglobal.row[i],&by);CHKERRQ(ierr);
759194d70fSJed Brown       ierr = VecCopy(by,bz[i]);CHKERRQ(ierr);
76336d21e7SJed Brown       ierr = VecRestoreSubVector(y,bA->isglobal.row[i],&by);CHKERRQ(ierr);
779194d70fSJed Brown     }
789194d70fSJed Brown     for (j=0; j<nc; j++) {
799194d70fSJed Brown       if (!bA->m[i][j]) continue;
809194d70fSJed Brown       /* y[i] <- y[i] + A[i][j] * x[j] */
819194d70fSJed Brown       ierr = MatMultAdd(bA->m[i][j],bx[j],bz[i],bz[i]);CHKERRQ(ierr);
829194d70fSJed Brown     }
839194d70fSJed Brown   }
849194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(z,bA->isglobal.row[i],&bz[i]);CHKERRQ(ierr);}
859194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
869194d70fSJed Brown   PetscFunctionReturn(0);
879194d70fSJed Brown }
889194d70fSJed Brown 
/*
  Nest_Dense - Data attached to the product C = A*B (A nest, B dense) by
  MatProductSymbolic_Nest_Dense() and released by MatNest_DenseDestroy().
*/
typedef struct {
  Mat          *workC;    /* array of k product matrices, entry i*nc+j holds A[i][j]*B[j]; each may carry containers specific to the underlying MatMatMult implementation */
  PetscScalar  *tarray;   /* single buffer shared by all workC matrices for storing the temporary products A[i][j] B[j] */
  PetscInt     *dm,*dn,k; /* dm/dn: cumulative local sizes (displacements) of the row/column index sets; k: number of submatrices (nr*nc) */
} Nest_Dense;
9452c5f739Sprj- 
956718818eSStefano Zampini PETSC_INTERN PetscErrorCode MatProductNumeric_Nest_Dense(Mat C)
9652c5f739Sprj- {
976718818eSStefano Zampini   Mat_Nest          *bA;
9852c5f739Sprj-   Nest_Dense        *contents;
996718818eSStefano Zampini   Mat               viewB,viewC,productB,workC;
10052c5f739Sprj-   const PetscScalar *barray;
10152c5f739Sprj-   PetscScalar       *carray;
1026718818eSStefano Zampini   PetscInt          i,j,M,N,nr,nc,ldb,ldc;
10352c5f739Sprj-   PetscErrorCode    ierr;
1046718818eSStefano Zampini   Mat               A,B;
10552c5f739Sprj- 
10652c5f739Sprj-   PetscFunctionBegin;
1076718818eSStefano Zampini   MatCheckProduct(C,3);
1086718818eSStefano Zampini   A    = C->product->A;
1096718818eSStefano Zampini   B    = C->product->B;
1106718818eSStefano Zampini   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
1116718818eSStefano Zampini   if (!N) {
1126718818eSStefano Zampini     ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1136718818eSStefano Zampini     ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1146718818eSStefano Zampini     PetscFunctionReturn(0);
1156718818eSStefano Zampini   }
1166718818eSStefano Zampini   contents = (Nest_Dense*)C->product->data;
1176718818eSStefano Zampini   if (!contents) SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Product data empty");
1186718818eSStefano Zampini   bA   = (Mat_Nest*)A->data;
1196718818eSStefano Zampini   nr   = bA->nr;
1206718818eSStefano Zampini   nc   = bA->nc;
12152c5f739Sprj-   ierr = MatDenseGetLDA(B,&ldb);CHKERRQ(ierr);
12252c5f739Sprj-   ierr = MatDenseGetLDA(C,&ldc);CHKERRQ(ierr);
12352c5f739Sprj-   ierr = MatZeroEntries(C);CHKERRQ(ierr);
12452c5f739Sprj-   ierr = MatDenseGetArrayRead(B,&barray);CHKERRQ(ierr);
1256718818eSStefano Zampini   ierr = MatDenseGetArrayWrite(C,&carray);CHKERRQ(ierr);
12652c5f739Sprj-   for (i=0; i<nr; i++) {
12752c5f739Sprj-     ierr = ISGetSize(bA->isglobal.row[i],&M);CHKERRQ(ierr);
12852c5f739Sprj-     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dm[i+1]-contents->dm[i],PETSC_DECIDE,M,N,carray+contents->dm[i],&viewC);CHKERRQ(ierr);
1296718818eSStefano Zampini     ierr = MatDenseSetLDA(viewC,ldc);CHKERRQ(ierr);
13052c5f739Sprj-     for (j=0; j<nc; j++) {
13152c5f739Sprj-       if (!bA->m[i][j]) continue;
13252c5f739Sprj-       ierr = ISGetSize(bA->isglobal.col[j],&M);CHKERRQ(ierr);
13352c5f739Sprj-       ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB);CHKERRQ(ierr);
1346718818eSStefano Zampini       ierr = MatDenseSetLDA(viewB,ldb);CHKERRQ(ierr);
1354222ddf1SHong Zhang 
1364222ddf1SHong Zhang       /* MatMatMultNumeric(bA->m[i][j],viewB,contents->workC[i*nc + j]); */
1374222ddf1SHong Zhang       workC             = contents->workC[i*nc + j];
1384222ddf1SHong Zhang       productB          = workC->product->B;
1394222ddf1SHong Zhang       workC->product->B = viewB; /* use newly created dense matrix viewB */
1406718818eSStefano Zampini       ierr = MatProductNumeric(workC);CHKERRQ(ierr);
14152c5f739Sprj-       ierr = MatDestroy(&viewB);CHKERRQ(ierr);
1424222ddf1SHong Zhang       workC->product->B = productB; /* resume original B */
1434222ddf1SHong Zhang 
14452c5f739Sprj-       /* C[i] <- workC + C[i] */
14552c5f739Sprj-       ierr = MatAXPY(viewC,1.0,contents->workC[i*nc + j],SAME_NONZERO_PATTERN);CHKERRQ(ierr);
14652c5f739Sprj-     }
14752c5f739Sprj-     ierr = MatDestroy(&viewC);CHKERRQ(ierr);
14852c5f739Sprj-   }
1496718818eSStefano Zampini   ierr = MatDenseRestoreArrayWrite(C,&carray);CHKERRQ(ierr);
15052c5f739Sprj-   ierr = MatDenseRestoreArrayRead(B,&barray);CHKERRQ(ierr);
1514222ddf1SHong Zhang 
1524222ddf1SHong Zhang   ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1534222ddf1SHong Zhang   ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15452c5f739Sprj-   PetscFunctionReturn(0);
15552c5f739Sprj- }
15652c5f739Sprj- 
15752c5f739Sprj- PetscErrorCode MatNest_DenseDestroy(void *ctx)
15852c5f739Sprj- {
15952c5f739Sprj-   Nest_Dense     *contents = (Nest_Dense*)ctx;
16052c5f739Sprj-   PetscInt       i;
16152c5f739Sprj-   PetscErrorCode ierr;
16252c5f739Sprj- 
16352c5f739Sprj-   PetscFunctionBegin;
16452c5f739Sprj-   ierr = PetscFree(contents->tarray);CHKERRQ(ierr);
16552c5f739Sprj-   for (i=0; i<contents->k; i++) {
16652c5f739Sprj-     ierr = MatDestroy(contents->workC + i);CHKERRQ(ierr);
16752c5f739Sprj-   }
16852c5f739Sprj-   ierr = PetscFree3(contents->dm,contents->dn,contents->workC);CHKERRQ(ierr);
16952c5f739Sprj-   ierr = PetscFree(contents);CHKERRQ(ierr);
17052c5f739Sprj-   PetscFunctionReturn(0);
17152c5f739Sprj- }
17252c5f739Sprj- 
1736718818eSStefano Zampini PETSC_INTERN PetscErrorCode MatProductSymbolic_Nest_Dense(Mat C)
17452c5f739Sprj- {
1756718818eSStefano Zampini   Mat_Nest          *bA;
1766718818eSStefano Zampini   Mat               viewB,workC;
17752c5f739Sprj-   const PetscScalar *barray;
1786718818eSStefano Zampini   PetscInt          i,j,M,N,m,n,nr,nc,maxm = 0,ldb;
1794222ddf1SHong Zhang   Nest_Dense        *contents=NULL;
1806718818eSStefano Zampini   PetscBool         cisdense;
18152c5f739Sprj-   PetscErrorCode    ierr;
1826718818eSStefano Zampini   Mat               A,B;
1836718818eSStefano Zampini   PetscReal         fill;
18452c5f739Sprj- 
18552c5f739Sprj-   PetscFunctionBegin;
1866718818eSStefano Zampini   MatCheckProduct(C,4);
1876718818eSStefano Zampini   if (C->product->data) SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Product data not empty");
1886718818eSStefano Zampini   A    = C->product->A;
1896718818eSStefano Zampini   B    = C->product->B;
1906718818eSStefano Zampini   fill = C->product->fill;
1916718818eSStefano Zampini   bA   = (Mat_Nest*)A->data;
1926718818eSStefano Zampini   nr   = bA->nr;
1936718818eSStefano Zampini   nc   = bA->nc;
1946718818eSStefano Zampini   ierr = MatGetLocalSize(B,NULL,&n);CHKERRQ(ierr);
19552c5f739Sprj-   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
19652c5f739Sprj-   ierr = MatGetLocalSize(A,&m,NULL);CHKERRQ(ierr);
19752c5f739Sprj-   ierr = MatGetSize(A,&M,NULL);CHKERRQ(ierr);
1986718818eSStefano Zampini   ierr = MatSetSizes(C,m,n,M,N);CHKERRQ(ierr);
1996718818eSStefano Zampini   ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATMPIDENSE,MATSEQDENSECUDA,MATMPIDENSECUDA,"");CHKERRQ(ierr);
2006718818eSStefano Zampini   if (!cisdense) {
2016718818eSStefano Zampini     ierr = MatSetType(C,((PetscObject)B)->type_name);CHKERRQ(ierr);
2026718818eSStefano Zampini   }
20318992e5dSStefano Zampini   ierr = MatSetUp(C);CHKERRQ(ierr);
2046718818eSStefano Zampini   if (!N) {
2056718818eSStefano Zampini     C->ops->productnumeric = MatProductNumeric_Nest_Dense;
2066718818eSStefano Zampini     PetscFunctionReturn(0);
20752c5f739Sprj-   }
20852c5f739Sprj- 
20952c5f739Sprj-   ierr = PetscNew(&contents);CHKERRQ(ierr);
2106718818eSStefano Zampini   C->product->data = contents;
2116718818eSStefano Zampini   C->product->destroy = MatNest_DenseDestroy;
21252c5f739Sprj-   ierr = PetscCalloc3(nr+1,&contents->dm,nc+1,&contents->dn,nr*nc,&contents->workC);CHKERRQ(ierr);
21352c5f739Sprj-   contents->k = nr*nc;
21452c5f739Sprj-   for (i=0; i<nr; i++) {
21552c5f739Sprj-     ierr = ISGetLocalSize(bA->isglobal.row[i],contents->dm + i+1);CHKERRQ(ierr);
21652c5f739Sprj-     maxm = PetscMax(maxm,contents->dm[i+1]);
21752c5f739Sprj-     contents->dm[i+1] += contents->dm[i];
21852c5f739Sprj-   }
21952c5f739Sprj-   for (i=0; i<nc; i++) {
22052c5f739Sprj-     ierr = ISGetLocalSize(bA->isglobal.col[i],contents->dn + i+1);CHKERRQ(ierr);
22152c5f739Sprj-     contents->dn[i+1] += contents->dn[i];
22252c5f739Sprj-   }
22352c5f739Sprj-   ierr = PetscMalloc1(maxm*N,&contents->tarray);CHKERRQ(ierr);
22452c5f739Sprj-   ierr = MatDenseGetLDA(B,&ldb);CHKERRQ(ierr);
22552c5f739Sprj-   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
22652c5f739Sprj-   ierr = MatDenseGetArrayRead(B,&barray);CHKERRQ(ierr);
22752c5f739Sprj-   /* loops are permuted compared to MatMatMultNumeric so that viewB is created only once per column of A */
22852c5f739Sprj-   for (j=0; j<nc; j++) {
22952c5f739Sprj-     ierr = ISGetSize(bA->isglobal.col[j],&M);CHKERRQ(ierr);
23052c5f739Sprj-     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB);CHKERRQ(ierr);
2316718818eSStefano Zampini     ierr = MatDenseSetLDA(viewB,ldb);CHKERRQ(ierr);
23252c5f739Sprj-     for (i=0; i<nr; i++) {
23352c5f739Sprj-       if (!bA->m[i][j]) continue;
23452c5f739Sprj-       /* MatMatMultSymbolic may attach a specific container (depending on MatType of bA->m[i][j]) to workC[i][j] */
2354222ddf1SHong Zhang 
2364222ddf1SHong Zhang       ierr = MatProductCreate(bA->m[i][j],viewB,NULL,&contents->workC[i*nc + j]);CHKERRQ(ierr);
2374222ddf1SHong Zhang       workC = contents->workC[i*nc + j];
2384222ddf1SHong Zhang       ierr = MatProductSetType(workC,MATPRODUCT_AB);CHKERRQ(ierr);
2394222ddf1SHong Zhang       ierr = MatProductSetAlgorithm(workC,"default");CHKERRQ(ierr);
2404222ddf1SHong Zhang       ierr = MatProductSetFill(workC,fill);CHKERRQ(ierr);
2414222ddf1SHong Zhang       ierr = MatProductSetFromOptions(workC);CHKERRQ(ierr);
2424222ddf1SHong Zhang       ierr = MatProductSymbolic(workC);CHKERRQ(ierr);
2434222ddf1SHong Zhang 
2446718818eSStefano Zampini       /* since tarray will be shared by all Mat */
2456718818eSStefano Zampini       ierr = MatSeqDenseSetPreallocation(workC,contents->tarray);CHKERRQ(ierr);
2466718818eSStefano Zampini       ierr = MatMPIDenseSetPreallocation(workC,contents->tarray);CHKERRQ(ierr);
24752c5f739Sprj-     }
24852c5f739Sprj-     ierr = MatDestroy(&viewB);CHKERRQ(ierr);
24952c5f739Sprj-   }
25052c5f739Sprj-   ierr = MatDenseRestoreArrayRead(B,&barray);CHKERRQ(ierr);
25152c5f739Sprj- 
2526718818eSStefano Zampini   C->ops->productnumeric = MatProductNumeric_Nest_Dense;
25352c5f739Sprj-   PetscFunctionReturn(0);
25452c5f739Sprj- }
25552c5f739Sprj- 
2564222ddf1SHong Zhang /* --------------------------------------------------------- */
2574222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_Nest_Dense_AB(Mat C)
2584222ddf1SHong Zhang {
2594222ddf1SHong Zhang   PetscFunctionBegin;
2606718818eSStefano Zampini   C->ops->productsymbolic = MatProductSymbolic_Nest_Dense;
2614222ddf1SHong Zhang   PetscFunctionReturn(0);
2624222ddf1SHong Zhang }
2634222ddf1SHong Zhang 
2644222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_Nest_Dense(Mat C)
26552c5f739Sprj- {
26652c5f739Sprj-   PetscErrorCode ierr;
2674222ddf1SHong Zhang   Mat_Product    *product = C->product;
26852c5f739Sprj- 
26952c5f739Sprj-   PetscFunctionBegin;
2704222ddf1SHong Zhang   if (product->type == MATPRODUCT_AB) {
2714222ddf1SHong Zhang     ierr = MatProductSetFromOptions_Nest_Dense_AB(C);CHKERRQ(ierr);
2726718818eSStefano Zampini   }
27352c5f739Sprj-   PetscFunctionReturn(0);
27452c5f739Sprj- }
2754222ddf1SHong Zhang /* --------------------------------------------------------- */
27652c5f739Sprj- 
277207556f9SJed Brown static PetscErrorCode MatMultTranspose_Nest(Mat A,Vec x,Vec y)
278d8588912SDave May {
279d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
280207556f9SJed Brown   Vec            *bx = bA->left,*by = bA->right;
281207556f9SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
282d8588912SDave May   PetscErrorCode ierr;
283d8588912SDave May 
284d8588912SDave May   PetscFunctionBegin;
285609e31cbSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
286609e31cbSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(y,bA->isglobal.col[i],&by[i]);CHKERRQ(ierr);}
287207556f9SJed Brown   for (j=0; j<nc; j++) {
288609e31cbSJed Brown     ierr = VecZeroEntries(by[j]);CHKERRQ(ierr);
289609e31cbSJed Brown     for (i=0; i<nr; i++) {
2906c75ac25SJed Brown       if (!bA->m[i][j]) continue;
291609e31cbSJed Brown       /* y[j] <- y[j] + (A[i][j])^T * x[i] */
292609e31cbSJed Brown       ierr = MatMultTransposeAdd(bA->m[i][j],bx[i],by[j],by[j]);CHKERRQ(ierr);
293d8588912SDave May     }
294d8588912SDave May   }
295609e31cbSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
296609e31cbSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(y,bA->isglobal.col[i],&by[i]);CHKERRQ(ierr);}
297d8588912SDave May   PetscFunctionReturn(0);
298d8588912SDave May }
299d8588912SDave May 
3009194d70fSJed Brown static PetscErrorCode MatMultTransposeAdd_Nest(Mat A,Vec x,Vec y,Vec z)
3019194d70fSJed Brown {
3029194d70fSJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
3039194d70fSJed Brown   Vec            *bx = bA->left,*bz = bA->right;
3049194d70fSJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
3059194d70fSJed Brown   PetscErrorCode ierr;
3069194d70fSJed Brown 
3079194d70fSJed Brown   PetscFunctionBegin;
3089194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
3099194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(z,bA->isglobal.col[i],&bz[i]);CHKERRQ(ierr);}
3109194d70fSJed Brown   for (j=0; j<nc; j++) {
3119194d70fSJed Brown     if (y != z) {
3129194d70fSJed Brown       Vec by;
3139194d70fSJed Brown       ierr = VecGetSubVector(y,bA->isglobal.col[j],&by);CHKERRQ(ierr);
3149194d70fSJed Brown       ierr = VecCopy(by,bz[j]);CHKERRQ(ierr);
3159194d70fSJed Brown       ierr = VecRestoreSubVector(y,bA->isglobal.col[j],&by);CHKERRQ(ierr);
3169194d70fSJed Brown     }
3179194d70fSJed Brown     for (i=0; i<nr; i++) {
3186c75ac25SJed Brown       if (!bA->m[i][j]) continue;
3199194d70fSJed Brown       /* z[j] <- y[j] + (A[i][j])^T * x[i] */
3209194d70fSJed Brown       ierr = MatMultTransposeAdd(bA->m[i][j],bx[i],bz[j],bz[j]);CHKERRQ(ierr);
3219194d70fSJed Brown     }
3229194d70fSJed Brown   }
3239194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
3249194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(z,bA->isglobal.col[i],&bz[i]);CHKERRQ(ierr);}
3259194d70fSJed Brown   PetscFunctionReturn(0);
3269194d70fSJed Brown }
3279194d70fSJed Brown 
/*
  MatTranspose_Nest - Transposes a nest matrix by transposing each of its blocks.

  Input Parameters:
+ A     - the nest matrix
- reuse - MAT_INITIAL_MATRIX, MAT_REUSE_MATRIX or MAT_INPLACE_MATRIX

  Output Parameter:
. B - the transposed nest matrix (written for MAT_INITIAL_MATRIX, read and reused for
      MAT_REUSE_MATRIX, not accessed for MAT_INPLACE_MATRIX)

  Notes:
  In-place transposition is only accepted when the number of block rows equals the
  number of block columns.
*/
static PetscErrorCode MatTranspose_Nest(Mat A,MatReuse reuse,Mat *B)
{
  Mat_Nest       *bA = (Mat_Nest*)A->data, *bC;
  Mat            C;
  PetscInt       i,j,nr = bA->nr,nc = bA->nc;
  PetscErrorCode ierr;

  PetscFunctionBegin;
  if (reuse == MAT_INPLACE_MATRIX && nr != nc) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_SIZ,"Square nested matrix only for in-place");

  if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_INPLACE_MATRIX) {
    /* a new nest C with nc x nr blocks has to be created */
    Mat *subs;
    IS  *is_row,*is_col;

    /* subs is zero-initialized: for MAT_INITIAL_MATRIX C is created with all blocks NULL */
    ierr = PetscCalloc1(nr * nc,&subs);CHKERRQ(ierr);
    ierr = PetscMalloc2(nr,&is_row,nc,&is_col);CHKERRQ(ierr);
    ierr = MatNestGetISs(A,is_row,is_col);CHKERRQ(ierr);
    if (reuse == MAT_INPLACE_MATRIX) {
      /* block (i,j) of A is placed at position (j,i) of the nc x nr row-major array */
      for (i=0; i<nr; i++) {
        for (j=0; j<nc; j++) {
          subs[i + nr * j] = bA->m[i][j];
        }
      }
    }

    /* row and column index sets of A are swapped for C */
    ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nc,is_col,nr,is_row,subs,&C);CHKERRQ(ierr);
    ierr = PetscFree(subs);CHKERRQ(ierr);
    ierr = PetscFree2(is_row,is_col);CHKERRQ(ierr);
  } else {
    /* MAT_REUSE_MATRIX: work directly on the matrix supplied by the caller */
    C = *B;
  }

  /* transpose every non-NULL block of A into the mirrored slot of C, with the same reuse mode */
  bC = (Mat_Nest*)C->data;
  for (i=0; i<nr; i++) {
    for (j=0; j<nc; j++) {
      if (bA->m[i][j]) {
        ierr = MatTranspose(bA->m[i][j], reuse, &(bC->m[j][i]));CHKERRQ(ierr);
      } else {
        bC->m[j][i] = NULL;
      }
    }
  }

  if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) {
    *B = C;
  } else {
    /* in-place: merge the temporary nest C into the header of A */
    ierr = MatHeaderMerge(A, &C);CHKERRQ(ierr);
  }
  PetscFunctionReturn(0);
}
378f8170845SAlex Fikl 
379e2d7f03fSJed Brown static PetscErrorCode MatNestDestroyISList(PetscInt n,IS **list)
380e2d7f03fSJed Brown {
381e2d7f03fSJed Brown   PetscErrorCode ierr;
382e2d7f03fSJed Brown   IS             *lst = *list;
383e2d7f03fSJed Brown   PetscInt       i;
384e2d7f03fSJed Brown 
385e2d7f03fSJed Brown   PetscFunctionBegin;
386e2d7f03fSJed Brown   if (!lst) PetscFunctionReturn(0);
3876bf464f9SBarry Smith   for (i=0; i<n; i++) if (lst[i]) {ierr = ISDestroy(&lst[i]);CHKERRQ(ierr);}
388e2d7f03fSJed Brown   ierr  = PetscFree(lst);CHKERRQ(ierr);
3890298fd71SBarry Smith   *list = NULL;
390e2d7f03fSJed Brown   PetscFunctionReturn(0);
391e2d7f03fSJed Brown }
392e2d7f03fSJed Brown 
39306a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat A)
394d8588912SDave May {
395d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
396d8588912SDave May   PetscInt       i,j;
397d8588912SDave May   PetscErrorCode ierr;
398d8588912SDave May 
399d8588912SDave May   PetscFunctionBegin;
400d8588912SDave May   /* release the matrices and the place holders */
401e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nr,&vs->isglobal.row);CHKERRQ(ierr);
402e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nc,&vs->isglobal.col);CHKERRQ(ierr);
403e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nr,&vs->islocal.row);CHKERRQ(ierr);
404e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nc,&vs->islocal.col);CHKERRQ(ierr);
405d8588912SDave May 
406d8588912SDave May   ierr = PetscFree(vs->row_len);CHKERRQ(ierr);
407d8588912SDave May   ierr = PetscFree(vs->col_len);CHKERRQ(ierr);
40806a1af2fSStefano Zampini   ierr = PetscFree(vs->nnzstate);CHKERRQ(ierr);
409d8588912SDave May 
410207556f9SJed Brown   ierr = PetscFree2(vs->left,vs->right);CHKERRQ(ierr);
411207556f9SJed Brown 
412d8588912SDave May   /* release the matrices and the place holders */
413d8588912SDave May   if (vs->m) {
414d8588912SDave May     for (i=0; i<vs->nr; i++) {
415d8588912SDave May       for (j=0; j<vs->nc; j++) {
4166bf464f9SBarry Smith         ierr = MatDestroy(&vs->m[i][j]);CHKERRQ(ierr);
417d8588912SDave May       }
418d8588912SDave May       ierr = PetscFree(vs->m[i]);CHKERRQ(ierr);
419d8588912SDave May     }
420d8588912SDave May     ierr = PetscFree(vs->m);CHKERRQ(ierr);
421d8588912SDave May   }
42206a1af2fSStefano Zampini 
42306a1af2fSStefano Zampini   /* restore defaults */
42406a1af2fSStefano Zampini   vs->nr = 0;
42506a1af2fSStefano Zampini   vs->nc = 0;
42606a1af2fSStefano Zampini   vs->splitassembly = PETSC_FALSE;
42706a1af2fSStefano Zampini   PetscFunctionReturn(0);
42806a1af2fSStefano Zampini }
42906a1af2fSStefano Zampini 
43006a1af2fSStefano Zampini static PetscErrorCode MatDestroy_Nest(Mat A)
43106a1af2fSStefano Zampini {
43206a1af2fSStefano Zampini   PetscErrorCode ierr;
43306a1af2fSStefano Zampini 
43406a1af2fSStefano Zampini   ierr = MatReset_Nest(A);CHKERRQ(ierr);
435bf0cc555SLisandro Dalcin   ierr = PetscFree(A->data);CHKERRQ(ierr);
436d8588912SDave May 
437bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",0);CHKERRQ(ierr);
438bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",0);CHKERRQ(ierr);
439bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",0);CHKERRQ(ierr);
440bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",0);CHKERRQ(ierr);
441bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",0);CHKERRQ(ierr);
442bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",0);CHKERRQ(ierr);
443bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",0);CHKERRQ(ierr);
444bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",0);CHKERRQ(ierr);
4450899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",0);CHKERRQ(ierr);
4460899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",0);CHKERRQ(ierr);
4475e3038f0Sstefano_zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",0);CHKERRQ(ierr);
4485e3038f0Sstefano_zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",0);CHKERRQ(ierr);
4494222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_seqdense_C",NULL);CHKERRQ(ierr);
4504222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_mpidense_C",NULL);CHKERRQ(ierr);
4514222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_dense_C",NULL);CHKERRQ(ierr);
452d8588912SDave May   PetscFunctionReturn(0);
453d8588912SDave May }
454d8588912SDave May 
455381b8e50SStefano Zampini static PetscErrorCode MatMissingDiagonal_Nest(Mat mat,PetscBool *missing,PetscInt *dd)
456381b8e50SStefano Zampini {
457381b8e50SStefano Zampini   Mat_Nest       *vs = (Mat_Nest*)mat->data;
458381b8e50SStefano Zampini   PetscInt       i;
459381b8e50SStefano Zampini   PetscErrorCode ierr;
460381b8e50SStefano Zampini 
461381b8e50SStefano Zampini   PetscFunctionBegin;
462381b8e50SStefano Zampini   if (dd) *dd = 0;
463381b8e50SStefano Zampini   if (!vs->nr) {
464381b8e50SStefano Zampini     *missing = PETSC_TRUE;
465381b8e50SStefano Zampini     PetscFunctionReturn(0);
466381b8e50SStefano Zampini   }
467381b8e50SStefano Zampini   *missing = PETSC_FALSE;
468381b8e50SStefano Zampini   for (i = 0; i < vs->nr && !(*missing); i++) {
469381b8e50SStefano Zampini     *missing = PETSC_TRUE;
470381b8e50SStefano Zampini     if (vs->m[i][i]) {
471381b8e50SStefano Zampini       ierr = MatMissingDiagonal(vs->m[i][i],missing,NULL);CHKERRQ(ierr);
472381b8e50SStefano Zampini       if (*missing && dd) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"First missing entry not yet implemented");
473381b8e50SStefano Zampini     }
474381b8e50SStefano Zampini   }
475381b8e50SStefano Zampini   PetscFunctionReturn(0);
476381b8e50SStefano Zampini }
477381b8e50SStefano Zampini 
478207556f9SJed Brown static PetscErrorCode MatAssemblyBegin_Nest(Mat A,MatAssemblyType type)
479d8588912SDave May {
480d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
481d8588912SDave May   PetscInt       i,j;
482d8588912SDave May   PetscErrorCode ierr;
48306a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
484d8588912SDave May 
485d8588912SDave May   PetscFunctionBegin;
486d8588912SDave May   for (i=0; i<vs->nr; i++) {
487d8588912SDave May     for (j=0; j<vs->nc; j++) {
48806a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
489e7c19651SJed Brown       if (vs->m[i][j]) {
490e7c19651SJed Brown         ierr = MatAssemblyBegin(vs->m[i][j],type);CHKERRQ(ierr);
491e7c19651SJed Brown         if (!vs->splitassembly) {
492e7c19651SJed Brown           /* Note: split assembly will fail if the same block appears more than once (even indirectly through a nested
493e7c19651SJed Brown            * sub-block). This could be fixed by adding a flag to Mat so that there was a way to check if a Mat was
494e7c19651SJed Brown            * already performing an assembly, but the result would by more complicated and appears to offer less
495e7c19651SJed Brown            * potential for diagnostics and correctness checking. Split assembly should be fixed once there is an
496e7c19651SJed Brown            * interface for libraries to make asynchronous progress in "user-defined non-blocking collectives".
497e7c19651SJed Brown            */
498e7c19651SJed Brown           ierr = MatAssemblyEnd(vs->m[i][j],type);CHKERRQ(ierr);
49906a1af2fSStefano Zampini           ierr = MatGetNonzeroState(vs->m[i][j],&subnnzstate);CHKERRQ(ierr);
500e7c19651SJed Brown         }
501e7c19651SJed Brown       }
50206a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || vs->nnzstate[i*vs->nc+j] != subnnzstate);
50306a1af2fSStefano Zampini       vs->nnzstate[i*vs->nc+j] = subnnzstate;
504d8588912SDave May     }
505d8588912SDave May   }
50606a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
507d8588912SDave May   PetscFunctionReturn(0);
508d8588912SDave May }
509d8588912SDave May 
510207556f9SJed Brown static PetscErrorCode MatAssemblyEnd_Nest(Mat A, MatAssemblyType type)
511d8588912SDave May {
512d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
513d8588912SDave May   PetscInt       i,j;
514d8588912SDave May   PetscErrorCode ierr;
515d8588912SDave May 
516d8588912SDave May   PetscFunctionBegin;
517d8588912SDave May   for (i=0; i<vs->nr; i++) {
518d8588912SDave May     for (j=0; j<vs->nc; j++) {
519e7c19651SJed Brown       if (vs->m[i][j]) {
520e7c19651SJed Brown         if (vs->splitassembly) {
521e7c19651SJed Brown           ierr = MatAssemblyEnd(vs->m[i][j],type);CHKERRQ(ierr);
522e7c19651SJed Brown         }
523e7c19651SJed Brown       }
524d8588912SDave May     }
525d8588912SDave May   }
526d8588912SDave May   PetscFunctionReturn(0);
527d8588912SDave May }
528d8588912SDave May 
529f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatRow(Mat A,PetscInt row,Mat *B)
530d8588912SDave May {
531207556f9SJed Brown   PetscErrorCode ierr;
532f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
533f349c1fdSJed Brown   PetscInt       j;
534f349c1fdSJed Brown   Mat            sub;
535d8588912SDave May 
536d8588912SDave May   PetscFunctionBegin;
5370298fd71SBarry Smith   sub = (row < vs->nc) ? vs->m[row][row] : (Mat)NULL; /* Prefer to find on the diagonal */
538f349c1fdSJed Brown   for (j=0; !sub && j<vs->nc; j++) sub = vs->m[row][j];
5394994cf47SJed Brown   if (sub) {ierr = MatSetUp(sub);CHKERRQ(ierr);}       /* Ensure that the sizes are available */
540f349c1fdSJed Brown   *B = sub;
541f349c1fdSJed Brown   PetscFunctionReturn(0);
542d8588912SDave May }
543d8588912SDave May 
544f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatCol(Mat A,PetscInt col,Mat *B)
545f349c1fdSJed Brown {
546207556f9SJed Brown   PetscErrorCode ierr;
547f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
548f349c1fdSJed Brown   PetscInt       i;
549f349c1fdSJed Brown   Mat            sub;
550f349c1fdSJed Brown 
551f349c1fdSJed Brown   PetscFunctionBegin;
5520298fd71SBarry Smith   sub = (col < vs->nr) ? vs->m[col][col] : (Mat)NULL; /* Prefer to find on the diagonal */
553f349c1fdSJed Brown   for (i=0; !sub && i<vs->nr; i++) sub = vs->m[i][col];
5544994cf47SJed Brown   if (sub) {ierr = MatSetUp(sub);CHKERRQ(ierr);}       /* Ensure that the sizes are available */
555f349c1fdSJed Brown   *B = sub;
556f349c1fdSJed Brown   PetscFunctionReturn(0);
557d8588912SDave May }
558d8588912SDave May 
559f349c1fdSJed Brown static PetscErrorCode MatNestFindIS(Mat A,PetscInt n,const IS list[],IS is,PetscInt *found)
560f349c1fdSJed Brown {
561f349c1fdSJed Brown   PetscErrorCode ierr;
562f349c1fdSJed Brown   PetscInt       i;
563f349c1fdSJed Brown   PetscBool      flg;
564f349c1fdSJed Brown 
565f349c1fdSJed Brown   PetscFunctionBegin;
566f349c1fdSJed Brown   PetscValidPointer(list,3);
567f349c1fdSJed Brown   PetscValidHeaderSpecific(is,IS_CLASSID,4);
568f349c1fdSJed Brown   PetscValidIntPointer(found,5);
569f349c1fdSJed Brown   *found = -1;
570f349c1fdSJed Brown   for (i=0; i<n; i++) {
571207556f9SJed Brown     if (!list[i]) continue;
572320466b0SStefano Zampini     ierr = ISEqualUnsorted(list[i],is,&flg);CHKERRQ(ierr);
573f349c1fdSJed Brown     if (flg) {
574f349c1fdSJed Brown       *found = i;
575f349c1fdSJed Brown       PetscFunctionReturn(0);
576f349c1fdSJed Brown     }
577f349c1fdSJed Brown   }
578ce94432eSBarry Smith   SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Could not find index set");
579f349c1fdSJed Brown }
580f349c1fdSJed Brown 
5818188e55aSJed Brown /* Get a block row as a new MatNest */
5828188e55aSJed Brown static PetscErrorCode MatNestGetRow(Mat A,PetscInt row,Mat *B)
5838188e55aSJed Brown {
5848188e55aSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
5858188e55aSJed Brown   char           keyname[256];
5868188e55aSJed Brown   PetscErrorCode ierr;
5878188e55aSJed Brown 
5888188e55aSJed Brown   PetscFunctionBegin;
5890298fd71SBarry Smith   *B   = NULL;
5908caf3d72SBarry Smith   ierr = PetscSNPrintf(keyname,sizeof(keyname),"NestRow_%D",row);CHKERRQ(ierr);
5918188e55aSJed Brown   ierr = PetscObjectQuery((PetscObject)A,keyname,(PetscObject*)B);CHKERRQ(ierr);
5928188e55aSJed Brown   if (*B) PetscFunctionReturn(0);
5938188e55aSJed Brown 
594ce94432eSBarry Smith   ierr = MatCreateNest(PetscObjectComm((PetscObject)A),1,NULL,vs->nc,vs->isglobal.col,vs->m[row],B);CHKERRQ(ierr);
59526fbe8dcSKarl Rupp 
5968188e55aSJed Brown   (*B)->assembled = A->assembled;
59726fbe8dcSKarl Rupp 
5988188e55aSJed Brown   ierr = PetscObjectCompose((PetscObject)A,keyname,(PetscObject)*B);CHKERRQ(ierr);
5998188e55aSJed Brown   ierr = PetscObjectDereference((PetscObject)*B);CHKERRQ(ierr); /* Leave the only remaining reference in the composition */
6008188e55aSJed Brown   PetscFunctionReturn(0);
6018188e55aSJed Brown }
6028188e55aSJed Brown 
603f349c1fdSJed Brown static PetscErrorCode MatNestFindSubMat(Mat A,struct MatNestISPair *is,IS isrow,IS iscol,Mat *B)
604f349c1fdSJed Brown {
605f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
6068188e55aSJed Brown   PetscErrorCode ierr;
6076b3a5b13SJed Brown   PetscInt       row,col;
608e072481dSJed Brown   PetscBool      same,isFullCol,isFullColGlobal;
609f349c1fdSJed Brown 
610f349c1fdSJed Brown   PetscFunctionBegin;
6118188e55aSJed Brown   /* Check if full column space. This is a hack */
6128188e55aSJed Brown   isFullCol = PETSC_FALSE;
613251f4c67SDmitry Karpeev   ierr      = PetscObjectTypeCompare((PetscObject)iscol,ISSTRIDE,&same);CHKERRQ(ierr);
6148188e55aSJed Brown   if (same) {
61577019fcaSJed Brown     PetscInt n,first,step,i,an,am,afirst,astep;
6168188e55aSJed Brown     ierr      = ISStrideGetInfo(iscol,&first,&step);CHKERRQ(ierr);
6178188e55aSJed Brown     ierr      = ISGetLocalSize(iscol,&n);CHKERRQ(ierr);
61877019fcaSJed Brown     isFullCol = PETSC_TRUE;
61905ce4453SJed Brown     for (i=0,an=A->cmap->rstart; i<vs->nc; i++) {
62006a1af2fSStefano Zampini       ierr = PetscObjectTypeCompare((PetscObject)is->col[i],ISSTRIDE,&same);CHKERRQ(ierr);
62177019fcaSJed Brown       ierr = ISGetLocalSize(is->col[i],&am);CHKERRQ(ierr);
62206a1af2fSStefano Zampini       if (same) {
62306a1af2fSStefano Zampini         ierr = ISStrideGetInfo(is->col[i],&afirst,&astep);CHKERRQ(ierr);
62477019fcaSJed Brown         if (afirst != an || astep != step) isFullCol = PETSC_FALSE;
62506a1af2fSStefano Zampini       } else isFullCol = PETSC_FALSE;
62677019fcaSJed Brown       an += am;
62777019fcaSJed Brown     }
62805ce4453SJed Brown     if (an != A->cmap->rstart+n) isFullCol = PETSC_FALSE;
6298188e55aSJed Brown   }
630b2566f29SBarry Smith   ierr = MPIU_Allreduce(&isFullCol,&isFullColGlobal,1,MPIU_BOOL,MPI_LAND,PetscObjectComm((PetscObject)iscol));CHKERRQ(ierr);
6318188e55aSJed Brown 
632427230ceSLisandro Dalcin   if (isFullColGlobal && vs->nc > 1) {
6338188e55aSJed Brown     PetscInt row;
6348188e55aSJed Brown     ierr = MatNestFindIS(A,vs->nr,is->row,isrow,&row);CHKERRQ(ierr);
6358188e55aSJed Brown     ierr = MatNestGetRow(A,row,B);CHKERRQ(ierr);
6368188e55aSJed Brown   } else {
637f349c1fdSJed Brown     ierr = MatNestFindIS(A,vs->nr,is->row,isrow,&row);CHKERRQ(ierr);
638f349c1fdSJed Brown     ierr = MatNestFindIS(A,vs->nc,is->col,iscol,&col);CHKERRQ(ierr);
639b6480e04SStefano Zampini     if (!vs->m[row][col]) {
640b6480e04SStefano Zampini       PetscInt lr,lc;
641b6480e04SStefano Zampini 
642b6480e04SStefano Zampini       ierr = MatCreate(PetscObjectComm((PetscObject)A),&vs->m[row][col]);CHKERRQ(ierr);
643b6480e04SStefano Zampini       ierr = ISGetLocalSize(vs->isglobal.row[row],&lr);CHKERRQ(ierr);
644b6480e04SStefano Zampini       ierr = ISGetLocalSize(vs->isglobal.col[col],&lc);CHKERRQ(ierr);
645b6480e04SStefano Zampini       ierr = MatSetSizes(vs->m[row][col],lr,lc,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr);
646fa9f0909SStefano Zampini       ierr = MatSetType(vs->m[row][col],MATAIJ);CHKERRQ(ierr);
647fa9f0909SStefano Zampini       ierr = MatSeqAIJSetPreallocation(vs->m[row][col],0,NULL);CHKERRQ(ierr);
648fa9f0909SStefano Zampini       ierr = MatMPIAIJSetPreallocation(vs->m[row][col],0,NULL,0,NULL);CHKERRQ(ierr);
649b6480e04SStefano Zampini       ierr = MatSetUp(vs->m[row][col]);CHKERRQ(ierr);
650b6480e04SStefano Zampini       ierr = MatAssemblyBegin(vs->m[row][col],MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
651b6480e04SStefano Zampini       ierr = MatAssemblyEnd(vs->m[row][col],MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
652b6480e04SStefano Zampini     }
653f349c1fdSJed Brown     *B = vs->m[row][col];
6548188e55aSJed Brown   }
655f349c1fdSJed Brown   PetscFunctionReturn(0);
656f349c1fdSJed Brown }
657f349c1fdSJed Brown 
65806a1af2fSStefano Zampini /*
65906a1af2fSStefano Zampini    TODO: This does not actually returns a submatrix we can modify
66006a1af2fSStefano Zampini */
6617dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrix_Nest(Mat A,IS isrow,IS iscol,MatReuse reuse,Mat *B)
662f349c1fdSJed Brown {
663f349c1fdSJed Brown   PetscErrorCode ierr;
664f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
665f349c1fdSJed Brown   Mat            sub;
666f349c1fdSJed Brown 
667f349c1fdSJed Brown   PetscFunctionBegin;
668f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->isglobal,isrow,iscol,&sub);CHKERRQ(ierr);
669f349c1fdSJed Brown   switch (reuse) {
670f349c1fdSJed Brown   case MAT_INITIAL_MATRIX:
6717874fa86SDave May     if (sub) { ierr = PetscObjectReference((PetscObject)sub);CHKERRQ(ierr); }
672f349c1fdSJed Brown     *B = sub;
673f349c1fdSJed Brown     break;
674f349c1fdSJed Brown   case MAT_REUSE_MATRIX:
675ce94432eSBarry Smith     if (sub != *B) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Submatrix was not used before in this call");
676f349c1fdSJed Brown     break;
677f349c1fdSJed Brown   case MAT_IGNORE_MATRIX:       /* Nothing to do */
678f349c1fdSJed Brown     break;
679511c6705SHong Zhang   case MAT_INPLACE_MATRIX:       /* Nothing to do */
680511c6705SHong Zhang     SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MAT_INPLACE_MATRIX is not supported yet");
681f349c1fdSJed Brown   }
682f349c1fdSJed Brown   PetscFunctionReturn(0);
683f349c1fdSJed Brown }
684f349c1fdSJed Brown 
685f349c1fdSJed Brown PetscErrorCode MatGetLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B)
686f349c1fdSJed Brown {
687f349c1fdSJed Brown   PetscErrorCode ierr;
688f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
689f349c1fdSJed Brown   Mat            sub;
690f349c1fdSJed Brown 
691f349c1fdSJed Brown   PetscFunctionBegin;
692f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub);CHKERRQ(ierr);
693f349c1fdSJed Brown   /* We allow the submatrix to be NULL, perhaps it would be better for the user to return an empty matrix instead */
694f349c1fdSJed Brown   if (sub) {ierr = PetscObjectReference((PetscObject)sub);CHKERRQ(ierr);}
695f349c1fdSJed Brown   *B = sub;
696d8588912SDave May   PetscFunctionReturn(0);
697d8588912SDave May }
698d8588912SDave May 
699207556f9SJed Brown static PetscErrorCode MatRestoreLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B)
700d8588912SDave May {
701d8588912SDave May   PetscErrorCode ierr;
702f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
703f349c1fdSJed Brown   Mat            sub;
704d8588912SDave May 
705d8588912SDave May   PetscFunctionBegin;
706f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub);CHKERRQ(ierr);
707ce94432eSBarry Smith   if (*B != sub) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has not been gotten");
708f349c1fdSJed Brown   if (sub) {
709ce94432eSBarry Smith     if (((PetscObject)sub)->refct <= 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has had reference count decremented too many times");
7106bf464f9SBarry Smith     ierr = MatDestroy(B);CHKERRQ(ierr);
711d8588912SDave May   }
712d8588912SDave May   PetscFunctionReturn(0);
713d8588912SDave May }
714d8588912SDave May 
7157874fa86SDave May static PetscErrorCode MatGetDiagonal_Nest(Mat A,Vec v)
7167874fa86SDave May {
7177874fa86SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
7187874fa86SDave May   PetscInt       i;
7197874fa86SDave May   PetscErrorCode ierr;
7207874fa86SDave May 
7217874fa86SDave May   PetscFunctionBegin;
7227874fa86SDave May   for (i=0; i<bA->nr; i++) {
723429bac76SJed Brown     Vec bv;
724429bac76SJed Brown     ierr = VecGetSubVector(v,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
7257874fa86SDave May     if (bA->m[i][i]) {
726429bac76SJed Brown       ierr = MatGetDiagonal(bA->m[i][i],bv);CHKERRQ(ierr);
7277874fa86SDave May     } else {
7285159a857SMatthew G. Knepley       ierr = VecSet(bv,0.0);CHKERRQ(ierr);
7297874fa86SDave May     }
730429bac76SJed Brown     ierr = VecRestoreSubVector(v,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
7317874fa86SDave May   }
7327874fa86SDave May   PetscFunctionReturn(0);
7337874fa86SDave May }
7347874fa86SDave May 
7357874fa86SDave May static PetscErrorCode MatDiagonalScale_Nest(Mat A,Vec l,Vec r)
7367874fa86SDave May {
7377874fa86SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
738429bac76SJed Brown   Vec            bl,*br;
7397874fa86SDave May   PetscInt       i,j;
7407874fa86SDave May   PetscErrorCode ierr;
7417874fa86SDave May 
7427874fa86SDave May   PetscFunctionBegin;
7433f800ebeSJed Brown   ierr = PetscCalloc1(bA->nc,&br);CHKERRQ(ierr);
7442e6472ebSElliott Sales de Andrade   if (r) {
745429bac76SJed Brown     for (j=0; j<bA->nc; j++) {ierr = VecGetSubVector(r,bA->isglobal.col[j],&br[j]);CHKERRQ(ierr);}
7462e6472ebSElliott Sales de Andrade   }
7472e6472ebSElliott Sales de Andrade   bl = NULL;
7487874fa86SDave May   for (i=0; i<bA->nr; i++) {
7492e6472ebSElliott Sales de Andrade     if (l) {
750429bac76SJed Brown       ierr = VecGetSubVector(l,bA->isglobal.row[i],&bl);CHKERRQ(ierr);
7512e6472ebSElliott Sales de Andrade     }
7527874fa86SDave May     for (j=0; j<bA->nc; j++) {
7537874fa86SDave May       if (bA->m[i][j]) {
754429bac76SJed Brown         ierr = MatDiagonalScale(bA->m[i][j],bl,br[j]);CHKERRQ(ierr);
7557874fa86SDave May       }
7567874fa86SDave May     }
7572e6472ebSElliott Sales de Andrade     if (l) {
758a061e289SJed Brown       ierr = VecRestoreSubVector(l,bA->isglobal.row[i],&bl);CHKERRQ(ierr);
7597874fa86SDave May     }
7602e6472ebSElliott Sales de Andrade   }
7612e6472ebSElliott Sales de Andrade   if (r) {
762429bac76SJed Brown     for (j=0; j<bA->nc; j++) {ierr = VecRestoreSubVector(r,bA->isglobal.col[j],&br[j]);CHKERRQ(ierr);}
7632e6472ebSElliott Sales de Andrade   }
764429bac76SJed Brown   ierr = PetscFree(br);CHKERRQ(ierr);
7657874fa86SDave May   PetscFunctionReturn(0);
7667874fa86SDave May }
7677874fa86SDave May 
768a061e289SJed Brown static PetscErrorCode MatScale_Nest(Mat A,PetscScalar a)
769a061e289SJed Brown {
770a061e289SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
771a061e289SJed Brown   PetscInt       i,j;
772a061e289SJed Brown   PetscErrorCode ierr;
773a061e289SJed Brown 
774a061e289SJed Brown   PetscFunctionBegin;
775a061e289SJed Brown   for (i=0; i<bA->nr; i++) {
776a061e289SJed Brown     for (j=0; j<bA->nc; j++) {
777a061e289SJed Brown       if (bA->m[i][j]) {
778a061e289SJed Brown         ierr = MatScale(bA->m[i][j],a);CHKERRQ(ierr);
779a061e289SJed Brown       }
780a061e289SJed Brown     }
781a061e289SJed Brown   }
782a061e289SJed Brown   PetscFunctionReturn(0);
783a061e289SJed Brown }
784a061e289SJed Brown 
785a061e289SJed Brown static PetscErrorCode MatShift_Nest(Mat A,PetscScalar a)
786a061e289SJed Brown {
787a061e289SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
788a061e289SJed Brown   PetscInt       i;
789a061e289SJed Brown   PetscErrorCode ierr;
79006a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
791a061e289SJed Brown 
792a061e289SJed Brown   PetscFunctionBegin;
793a061e289SJed Brown   for (i=0; i<bA->nr; i++) {
79406a1af2fSStefano Zampini     PetscObjectState subnnzstate = 0;
795ce94432eSBarry Smith     if (!bA->m[i][i]) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"No support for shifting an empty diagonal block, insert a matrix in block (%D,%D)",i,i);
796a061e289SJed Brown     ierr = MatShift(bA->m[i][i],a);CHKERRQ(ierr);
79706a1af2fSStefano Zampini     ierr = MatGetNonzeroState(bA->m[i][i],&subnnzstate);CHKERRQ(ierr);
79806a1af2fSStefano Zampini     nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i*bA->nc+i] != subnnzstate);
79906a1af2fSStefano Zampini     bA->nnzstate[i*bA->nc+i] = subnnzstate;
800a061e289SJed Brown   }
80106a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
802a061e289SJed Brown   PetscFunctionReturn(0);
803a061e289SJed Brown }
804a061e289SJed Brown 
80513135bc6SAlex Fikl static PetscErrorCode MatDiagonalSet_Nest(Mat A,Vec D,InsertMode is)
80613135bc6SAlex Fikl {
80713135bc6SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data;
80813135bc6SAlex Fikl   PetscInt       i;
80913135bc6SAlex Fikl   PetscErrorCode ierr;
81006a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
81113135bc6SAlex Fikl 
81213135bc6SAlex Fikl   PetscFunctionBegin;
81313135bc6SAlex Fikl   for (i=0; i<bA->nr; i++) {
81406a1af2fSStefano Zampini     PetscObjectState subnnzstate = 0;
81513135bc6SAlex Fikl     Vec              bv;
81613135bc6SAlex Fikl     ierr = VecGetSubVector(D,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
81713135bc6SAlex Fikl     if (bA->m[i][i]) {
81813135bc6SAlex Fikl       ierr = MatDiagonalSet(bA->m[i][i],bv,is);CHKERRQ(ierr);
81906a1af2fSStefano Zampini       ierr = MatGetNonzeroState(bA->m[i][i],&subnnzstate);CHKERRQ(ierr);
82013135bc6SAlex Fikl     }
82113135bc6SAlex Fikl     ierr = VecRestoreSubVector(D,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
82206a1af2fSStefano Zampini     nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i*bA->nc+i] != subnnzstate);
82306a1af2fSStefano Zampini     bA->nnzstate[i*bA->nc+i] = subnnzstate;
82413135bc6SAlex Fikl   }
82506a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
82613135bc6SAlex Fikl   PetscFunctionReturn(0);
82713135bc6SAlex Fikl }
82813135bc6SAlex Fikl 
829f8170845SAlex Fikl static PetscErrorCode MatSetRandom_Nest(Mat A,PetscRandom rctx)
830f8170845SAlex Fikl {
831f8170845SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data;
832f8170845SAlex Fikl   PetscInt       i,j;
833f8170845SAlex Fikl   PetscErrorCode ierr;
834f8170845SAlex Fikl 
835f8170845SAlex Fikl   PetscFunctionBegin;
836f8170845SAlex Fikl   for (i=0; i<bA->nr; i++) {
837f8170845SAlex Fikl     for (j=0; j<bA->nc; j++) {
838f8170845SAlex Fikl       if (bA->m[i][j]) {
839f8170845SAlex Fikl         ierr = MatSetRandom(bA->m[i][j],rctx);CHKERRQ(ierr);
840f8170845SAlex Fikl       }
841f8170845SAlex Fikl     }
842f8170845SAlex Fikl   }
843f8170845SAlex Fikl   PetscFunctionReturn(0);
844f8170845SAlex Fikl }
845f8170845SAlex Fikl 
8462a7a6963SBarry Smith static PetscErrorCode MatCreateVecs_Nest(Mat A,Vec *right,Vec *left)
847d8588912SDave May {
848d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
849d8588912SDave May   Vec            *L,*R;
850d8588912SDave May   MPI_Comm       comm;
851d8588912SDave May   PetscInt       i,j;
852d8588912SDave May   PetscErrorCode ierr;
853d8588912SDave May 
854d8588912SDave May   PetscFunctionBegin;
855ce94432eSBarry Smith   ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr);
856d8588912SDave May   if (right) {
857d8588912SDave May     /* allocate R */
858854ce69bSBarry Smith     ierr = PetscMalloc1(bA->nc, &R);CHKERRQ(ierr);
859d8588912SDave May     /* Create the right vectors */
860d8588912SDave May     for (j=0; j<bA->nc; j++) {
861d8588912SDave May       for (i=0; i<bA->nr; i++) {
862d8588912SDave May         if (bA->m[i][j]) {
8632a7a6963SBarry Smith           ierr = MatCreateVecs(bA->m[i][j],&R[j],NULL);CHKERRQ(ierr);
864d8588912SDave May           break;
865d8588912SDave May         }
866d8588912SDave May       }
8676c4ed002SBarry Smith       if (i==bA->nr) SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null column.");
868d8588912SDave May     }
869f349c1fdSJed Brown     ierr = VecCreateNest(comm,bA->nc,bA->isglobal.col,R,right);CHKERRQ(ierr);
870d8588912SDave May     /* hand back control to the nest vector */
871d8588912SDave May     for (j=0; j<bA->nc; j++) {
8726bf464f9SBarry Smith       ierr = VecDestroy(&R[j]);CHKERRQ(ierr);
873d8588912SDave May     }
874d8588912SDave May     ierr = PetscFree(R);CHKERRQ(ierr);
875d8588912SDave May   }
876d8588912SDave May 
877d8588912SDave May   if (left) {
878d8588912SDave May     /* allocate L */
879854ce69bSBarry Smith     ierr = PetscMalloc1(bA->nr, &L);CHKERRQ(ierr);
880d8588912SDave May     /* Create the left vectors */
881d8588912SDave May     for (i=0; i<bA->nr; i++) {
882d8588912SDave May       for (j=0; j<bA->nc; j++) {
883d8588912SDave May         if (bA->m[i][j]) {
8842a7a6963SBarry Smith           ierr = MatCreateVecs(bA->m[i][j],NULL,&L[i]);CHKERRQ(ierr);
885d8588912SDave May           break;
886d8588912SDave May         }
887d8588912SDave May       }
8886c4ed002SBarry Smith       if (j==bA->nc) SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null row.");
889d8588912SDave May     }
890d8588912SDave May 
891f349c1fdSJed Brown     ierr = VecCreateNest(comm,bA->nr,bA->isglobal.row,L,left);CHKERRQ(ierr);
892d8588912SDave May     for (i=0; i<bA->nr; i++) {
8936bf464f9SBarry Smith       ierr = VecDestroy(&L[i]);CHKERRQ(ierr);
894d8588912SDave May     }
895d8588912SDave May 
896d8588912SDave May     ierr = PetscFree(L);CHKERRQ(ierr);
897d8588912SDave May   }
898d8588912SDave May   PetscFunctionReturn(0);
899d8588912SDave May }
900d8588912SDave May 
901207556f9SJed Brown static PetscErrorCode MatView_Nest(Mat A,PetscViewer viewer)
902d8588912SDave May {
903d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
90429e60adbSStefano Zampini   PetscBool      isascii,viewSub = PETSC_FALSE;
905d8588912SDave May   PetscInt       i,j;
906d8588912SDave May   PetscErrorCode ierr;
907d8588912SDave May 
908d8588912SDave May   PetscFunctionBegin;
909251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
910d8588912SDave May   if (isascii) {
911d8588912SDave May 
91229e60adbSStefano Zampini     ierr = PetscOptionsGetBool(((PetscObject)A)->options,((PetscObject)A)->prefix,"-mat_view_nest_sub",&viewSub,NULL);CHKERRQ(ierr);
913d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"Matrix object: \n");CHKERRQ(ierr);
914d86155a6SBarry Smith     ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);
915d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer, "type=nest, rows=%D, cols=%D \n",bA->nr,bA->nc);CHKERRQ(ierr);
916d8588912SDave May 
917d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"MatNest structure: \n");CHKERRQ(ierr);
918d8588912SDave May     for (i=0; i<bA->nr; i++) {
919d8588912SDave May       for (j=0; j<bA->nc; j++) {
92019fd82e9SBarry Smith         MatType   type;
921270f95d7SJed Brown         char      name[256] = "",prefix[256] = "";
922d8588912SDave May         PetscInt  NR,NC;
923d8588912SDave May         PetscBool isNest = PETSC_FALSE;
924d8588912SDave May 
925d8588912SDave May         if (!bA->m[i][j]) {
92685019af4SBarry Smith           ierr = PetscViewerASCIIPrintf(viewer, "(%D,%D) : NULL \n",i,j);CHKERRQ(ierr);
927d8588912SDave May           continue;
928d8588912SDave May         }
929d8588912SDave May         ierr = MatGetSize(bA->m[i][j],&NR,&NC);CHKERRQ(ierr);
930d8588912SDave May         ierr = MatGetType(bA->m[i][j], &type);CHKERRQ(ierr);
9318caf3d72SBarry Smith         if (((PetscObject)bA->m[i][j])->name) {ierr = PetscSNPrintf(name,sizeof(name),"name=\"%s\", ",((PetscObject)bA->m[i][j])->name);CHKERRQ(ierr);}
9328caf3d72SBarry Smith         if (((PetscObject)bA->m[i][j])->prefix) {ierr = PetscSNPrintf(prefix,sizeof(prefix),"prefix=\"%s\", ",((PetscObject)bA->m[i][j])->prefix);CHKERRQ(ierr);}
933251f4c67SDmitry Karpeev         ierr = PetscObjectTypeCompare((PetscObject)bA->m[i][j],MATNEST,&isNest);CHKERRQ(ierr);
934d8588912SDave May 
935270f95d7SJed Brown         ierr = PetscViewerASCIIPrintf(viewer,"(%D,%D) : %s%stype=%s, rows=%D, cols=%D \n",i,j,name,prefix,type,NR,NC);CHKERRQ(ierr);
936d8588912SDave May 
93729e60adbSStefano Zampini         if (isNest || viewSub) {
938270f95d7SJed Brown           ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);  /* push1 */
939d8588912SDave May           ierr = MatView(bA->m[i][j],viewer);CHKERRQ(ierr);
940270f95d7SJed Brown           ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);    /* pop1 */
941d8588912SDave May         }
942d8588912SDave May       }
943d8588912SDave May     }
944d86155a6SBarry Smith     ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);    /* pop0 */
945d8588912SDave May   }
946d8588912SDave May   PetscFunctionReturn(0);
947d8588912SDave May }
948d8588912SDave May 
949207556f9SJed Brown static PetscErrorCode MatZeroEntries_Nest(Mat A)
950d8588912SDave May {
951d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
952d8588912SDave May   PetscInt       i,j;
953d8588912SDave May   PetscErrorCode ierr;
954d8588912SDave May 
955d8588912SDave May   PetscFunctionBegin;
956d8588912SDave May   for (i=0; i<bA->nr; i++) {
957d8588912SDave May     for (j=0; j<bA->nc; j++) {
958d8588912SDave May       if (!bA->m[i][j]) continue;
959d8588912SDave May       ierr = MatZeroEntries(bA->m[i][j]);CHKERRQ(ierr);
960d8588912SDave May     }
961d8588912SDave May   }
962d8588912SDave May   PetscFunctionReturn(0);
963d8588912SDave May }
964d8588912SDave May 
965c222c20dSDavid Ham static PetscErrorCode MatCopy_Nest(Mat A,Mat B,MatStructure str)
966c222c20dSDavid Ham {
967c222c20dSDavid Ham   Mat_Nest       *bA = (Mat_Nest*)A->data,*bB = (Mat_Nest*)B->data;
968c222c20dSDavid Ham   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
969c222c20dSDavid Ham   PetscErrorCode ierr;
97006a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
971c222c20dSDavid Ham 
972c222c20dSDavid Ham   PetscFunctionBegin;
973c222c20dSDavid Ham   if (nr != bB->nr || nc != bB->nc) SETERRQ4(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Cannot copy a Mat_Nest of block size (%D,%D) to a Mat_Nest of block size (%D,%D)",bB->nr,bB->nc,nr,nc);
974c222c20dSDavid Ham   for (i=0; i<nr; i++) {
975c222c20dSDavid Ham     for (j=0; j<nc; j++) {
97606a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
97746a2b97cSJed Brown       if (bA->m[i][j] && bB->m[i][j]) {
978c222c20dSDavid Ham         ierr = MatCopy(bA->m[i][j],bB->m[i][j],str);CHKERRQ(ierr);
97946a2b97cSJed Brown       } else if (bA->m[i][j] || bB->m[i][j]) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %D,%D",i,j);
98006a1af2fSStefano Zampini       ierr = MatGetNonzeroState(bB->m[i][j],&subnnzstate);CHKERRQ(ierr);
98106a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || bB->nnzstate[i*nc+j] != subnnzstate);
98206a1af2fSStefano Zampini       bB->nnzstate[i*nc+j] = subnnzstate;
983c222c20dSDavid Ham     }
984c222c20dSDavid Ham   }
98506a1af2fSStefano Zampini   if (nnzstate) B->nonzerostate++;
986c222c20dSDavid Ham   PetscFunctionReturn(0);
987c222c20dSDavid Ham }
988c222c20dSDavid Ham 
9896e76ffeaSPierre Jolivet static PetscErrorCode MatAXPY_Nest(Mat Y,PetscScalar a,Mat X,MatStructure str)
9906e76ffeaSPierre Jolivet {
9916e76ffeaSPierre Jolivet   Mat_Nest       *bY = (Mat_Nest*)Y->data,*bX = (Mat_Nest*)X->data;
9926e76ffeaSPierre Jolivet   PetscInt       i,j,nr = bY->nr,nc = bY->nc;
9936e76ffeaSPierre Jolivet   PetscErrorCode ierr;
99406a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
9956e76ffeaSPierre Jolivet 
9966e76ffeaSPierre Jolivet   PetscFunctionBegin;
9976e76ffeaSPierre Jolivet   if (nr != bX->nr || nc != bX->nc) SETERRQ4(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Cannot AXPY a MatNest of block size (%D,%D) with a MatNest of block size (%D,%D)",bX->nr,bX->nc,nr,nc);
9986e76ffeaSPierre Jolivet   for (i=0; i<nr; i++) {
9996e76ffeaSPierre Jolivet     for (j=0; j<nc; j++) {
100006a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
10016e76ffeaSPierre Jolivet       if (bY->m[i][j] && bX->m[i][j]) {
10026e76ffeaSPierre Jolivet         ierr = MatAXPY(bY->m[i][j],a,bX->m[i][j],str);CHKERRQ(ierr);
1003c066aebcSStefano Zampini       } else if (bX->m[i][j]) {
1004c066aebcSStefano Zampini         Mat M;
1005c066aebcSStefano Zampini 
1006060bfc19SStefano Zampini         if (str != DIFFERENT_NONZERO_PATTERN) SETERRQ2(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %D,%D. Use DIFFERENT_NONZERO_PATTERN",i,j);
1007c066aebcSStefano Zampini         ierr = MatDuplicate(bX->m[i][j],MAT_COPY_VALUES,&M);CHKERRQ(ierr);
1008c066aebcSStefano Zampini         ierr = MatNestSetSubMat(Y,i,j,M);CHKERRQ(ierr);
1009c066aebcSStefano Zampini         ierr = MatDestroy(&M);CHKERRQ(ierr);
1010c066aebcSStefano Zampini       }
1011060bfc19SStefano Zampini       if (bY->m[i][j]) { ierr = MatGetNonzeroState(bY->m[i][j],&subnnzstate);CHKERRQ(ierr); }
101206a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || bY->nnzstate[i*nc+j] != subnnzstate);
101306a1af2fSStefano Zampini       bY->nnzstate[i*nc+j] = subnnzstate;
10146e76ffeaSPierre Jolivet     }
10156e76ffeaSPierre Jolivet   }
101606a1af2fSStefano Zampini   if (nnzstate) Y->nonzerostate++;
10176e76ffeaSPierre Jolivet   PetscFunctionReturn(0);
10186e76ffeaSPierre Jolivet }
10196e76ffeaSPierre Jolivet 
1020207556f9SJed Brown static PetscErrorCode MatDuplicate_Nest(Mat A,MatDuplicateOption op,Mat *B)
1021d8588912SDave May {
1022d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
1023841e96a3SJed Brown   Mat            *b;
1024841e96a3SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
1025d8588912SDave May   PetscErrorCode ierr;
1026d8588912SDave May 
1027d8588912SDave May   PetscFunctionBegin;
1028785e854fSJed Brown   ierr = PetscMalloc1(nr*nc,&b);CHKERRQ(ierr);
1029841e96a3SJed Brown   for (i=0; i<nr; i++) {
1030841e96a3SJed Brown     for (j=0; j<nc; j++) {
1031841e96a3SJed Brown       if (bA->m[i][j]) {
1032841e96a3SJed Brown         ierr = MatDuplicate(bA->m[i][j],op,&b[i*nc+j]);CHKERRQ(ierr);
1033841e96a3SJed Brown       } else {
10340298fd71SBarry Smith         b[i*nc+j] = NULL;
1035d8588912SDave May       }
1036d8588912SDave May     }
1037d8588912SDave May   }
1038ce94432eSBarry Smith   ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nr,bA->isglobal.row,nc,bA->isglobal.col,b,B);CHKERRQ(ierr);
1039841e96a3SJed Brown   /* Give the new MatNest exclusive ownership */
1040841e96a3SJed Brown   for (i=0; i<nr*nc; i++) {
10416bf464f9SBarry Smith     ierr = MatDestroy(&b[i]);CHKERRQ(ierr);
1042d8588912SDave May   }
1043d8588912SDave May   ierr = PetscFree(b);CHKERRQ(ierr);
1044d8588912SDave May 
1045841e96a3SJed Brown   ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1046841e96a3SJed Brown   ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1047d8588912SDave May   PetscFunctionReturn(0);
1048d8588912SDave May }
1049d8588912SDave May 
1050d8588912SDave May /* nest api */
1051d8588912SDave May PetscErrorCode MatNestGetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat *mat)
1052d8588912SDave May {
1053d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
10545fd66863SKarl Rupp 
1055d8588912SDave May   PetscFunctionBegin;
1056ce94432eSBarry Smith   if (idxm >= bA->nr) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",idxm,bA->nr-1);
1057ce94432eSBarry Smith   if (jdxm >= bA->nc) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %D max %D",jdxm,bA->nc-1);
1058d8588912SDave May   *mat = bA->m[idxm][jdxm];
1059d8588912SDave May   PetscFunctionReturn(0);
1060d8588912SDave May }
1061d8588912SDave May 
10629ba0d327SJed Brown /*@
1063d8588912SDave May  MatNestGetSubMat - Returns a single, sub-matrix from a nest matrix.
1064d8588912SDave May 
1065d8588912SDave May  Not collective
1066d8588912SDave May 
1067d8588912SDave May  Input Parameters:
1068629881c0SJed Brown +   A  - nest matrix
1069d8588912SDave May .   idxm - index of the matrix within the nest matrix
1070629881c0SJed Brown -   jdxm - index of the matrix within the nest matrix
1071d8588912SDave May 
1072d8588912SDave May  Output Parameter:
1073d8588912SDave May .   sub - matrix at index idxm,jdxm within the nest matrix
1074d8588912SDave May 
1075d8588912SDave May  Level: developer
1076d8588912SDave May 
1077bb97c47cSPierre Jolivet .seealso: MatNestGetSize(), MatNestGetSubMats(), MatCreateNest(), MATNEST, MatNestSetSubMat(),
107879798668SBarry Smith           MatNestGetLocalISs(), MatNestGetISs()
1079d8588912SDave May @*/
10807087cfbeSBarry Smith PetscErrorCode  MatNestGetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat *sub)
1081d8588912SDave May {
1082699a902aSJed Brown   PetscErrorCode ierr;
1083d8588912SDave May 
1084d8588912SDave May   PetscFunctionBegin;
1085699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSubMat_C",(Mat,PetscInt,PetscInt,Mat*),(A,idxm,jdxm,sub));CHKERRQ(ierr);
1086d8588912SDave May   PetscFunctionReturn(0);
1087d8588912SDave May }
1088d8588912SDave May 
10890782ca92SJed Brown PetscErrorCode MatNestSetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat mat)
10900782ca92SJed Brown {
10910782ca92SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
10920782ca92SJed Brown   PetscInt       m,n,M,N,mi,ni,Mi,Ni;
10930782ca92SJed Brown   PetscErrorCode ierr;
10940782ca92SJed Brown 
10950782ca92SJed Brown   PetscFunctionBegin;
1096ce94432eSBarry Smith   if (idxm >= bA->nr) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",idxm,bA->nr-1);
1097ce94432eSBarry Smith   if (jdxm >= bA->nc) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %D max %D",jdxm,bA->nc-1);
10980782ca92SJed Brown   ierr = MatGetLocalSize(mat,&m,&n);CHKERRQ(ierr);
10990782ca92SJed Brown   ierr = MatGetSize(mat,&M,&N);CHKERRQ(ierr);
11000782ca92SJed Brown   ierr = ISGetLocalSize(bA->isglobal.row[idxm],&mi);CHKERRQ(ierr);
11010782ca92SJed Brown   ierr = ISGetSize(bA->isglobal.row[idxm],&Mi);CHKERRQ(ierr);
11020782ca92SJed Brown   ierr = ISGetLocalSize(bA->isglobal.col[jdxm],&ni);CHKERRQ(ierr);
11030782ca92SJed Brown   ierr = ISGetSize(bA->isglobal.col[jdxm],&Ni);CHKERRQ(ierr);
1104ce94432eSBarry Smith   if (M != Mi || N != Ni) SETERRQ4(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix dimension (%D,%D) incompatible with nest block (%D,%D)",M,N,Mi,Ni);
1105ce94432eSBarry Smith   if (m != mi || n != ni) SETERRQ4(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix local dimension (%D,%D) incompatible with nest block (%D,%D)",m,n,mi,ni);
110626fbe8dcSKarl Rupp 
110706a1af2fSStefano Zampini   /* do not increase object state */
110806a1af2fSStefano Zampini   if (mat == bA->m[idxm][jdxm]) PetscFunctionReturn(0);
110906a1af2fSStefano Zampini 
11100782ca92SJed Brown   ierr = PetscObjectReference((PetscObject)mat);CHKERRQ(ierr);
11110782ca92SJed Brown   ierr = MatDestroy(&bA->m[idxm][jdxm]);CHKERRQ(ierr);
11120782ca92SJed Brown   bA->m[idxm][jdxm] = mat;
111306a1af2fSStefano Zampini   ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr);
111406a1af2fSStefano Zampini   ierr = MatGetNonzeroState(mat,&bA->nnzstate[idxm*bA->nc+jdxm]);CHKERRQ(ierr);
111506a1af2fSStefano Zampini   A->nonzerostate++;
11160782ca92SJed Brown   PetscFunctionReturn(0);
11170782ca92SJed Brown }
11180782ca92SJed Brown 
11199ba0d327SJed Brown /*@
11200782ca92SJed Brown  MatNestSetSubMat - Set a single submatrix in the nest matrix.
11210782ca92SJed Brown 
11220782ca92SJed Brown  Logically collective on the submatrix communicator
11230782ca92SJed Brown 
11240782ca92SJed Brown  Input Parameters:
11250782ca92SJed Brown +   A  - nest matrix
11260782ca92SJed Brown .   idxm - index of the matrix within the nest matrix
11270782ca92SJed Brown .   jdxm - index of the matrix within the nest matrix
11280782ca92SJed Brown -   sub - matrix at index idxm,jdxm within the nest matrix
11290782ca92SJed Brown 
11300782ca92SJed Brown  Notes:
11310782ca92SJed Brown  The new submatrix must have the same size and communicator as that block of the nest.
11320782ca92SJed Brown 
11330782ca92SJed Brown  This increments the reference count of the submatrix.
11340782ca92SJed Brown 
11350782ca92SJed Brown  Level: developer
11360782ca92SJed Brown 
1137bb97c47cSPierre Jolivet .seealso: MatNestSetSubMats(), MatNestGetSubMats(), MatNestGetLocalISs(), MATNEST, MatCreateNest(),
113879798668SBarry Smith           MatNestGetSubMat(), MatNestGetISs(), MatNestGetSize()
11390782ca92SJed Brown @*/
11400782ca92SJed Brown PetscErrorCode  MatNestSetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat sub)
11410782ca92SJed Brown {
11420782ca92SJed Brown   PetscErrorCode ierr;
11430782ca92SJed Brown 
11440782ca92SJed Brown   PetscFunctionBegin;
11450782ca92SJed Brown   ierr = PetscUseMethod(A,"MatNestSetSubMat_C",(Mat,PetscInt,PetscInt,Mat),(A,idxm,jdxm,sub));CHKERRQ(ierr);
11460782ca92SJed Brown   PetscFunctionReturn(0);
11470782ca92SJed Brown }
11480782ca92SJed Brown 
1149d8588912SDave May PetscErrorCode MatNestGetSubMats_Nest(Mat A,PetscInt *M,PetscInt *N,Mat ***mat)
1150d8588912SDave May {
1151d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
11525fd66863SKarl Rupp 
1153d8588912SDave May   PetscFunctionBegin;
115426fbe8dcSKarl Rupp   if (M)   *M   = bA->nr;
115526fbe8dcSKarl Rupp   if (N)   *N   = bA->nc;
115626fbe8dcSKarl Rupp   if (mat) *mat = bA->m;
1157d8588912SDave May   PetscFunctionReturn(0);
1158d8588912SDave May }
1159d8588912SDave May 
1160d8588912SDave May /*@C
1161d8588912SDave May  MatNestGetSubMats - Returns the entire two dimensional array of matrices defining a nest matrix.
1162d8588912SDave May 
1163d8588912SDave May  Not collective
1164d8588912SDave May 
1165d8588912SDave May  Input Parameters:
1166629881c0SJed Brown .   A  - nest matrix
1167d8588912SDave May 
1168d8588912SDave May  Output Parameter:
1169629881c0SJed Brown +   M - number of rows in the nest matrix
1170d8588912SDave May .   N - number of cols in the nest matrix
1171629881c0SJed Brown -   mat - 2d array of matrices
1172d8588912SDave May 
1173d8588912SDave May  Notes:
1174d8588912SDave May 
1175d8588912SDave May  The user should not free the array mat.
1176d8588912SDave May 
1177351962e3SVincent Le Chenadec  In Fortran, this routine has a calling sequence
1178351962e3SVincent Le Chenadec $   call MatNestGetSubMats(A, M, N, mat, ierr)
1179351962e3SVincent Le Chenadec  where the space allocated for the optional argument mat is assumed large enough (if provided).
1180351962e3SVincent Le Chenadec 
1181d8588912SDave May  Level: developer
1182d8588912SDave May 
1183bb97c47cSPierre Jolivet .seealso: MatNestGetSize(), MatNestGetSubMat(), MatNestGetLocalISs(), MATNEST, MatCreateNest(),
118479798668SBarry Smith           MatNestSetSubMats(), MatNestGetISs(), MatNestSetSubMat()
1185d8588912SDave May @*/
11867087cfbeSBarry Smith PetscErrorCode  MatNestGetSubMats(Mat A,PetscInt *M,PetscInt *N,Mat ***mat)
1187d8588912SDave May {
1188699a902aSJed Brown   PetscErrorCode ierr;
1189d8588912SDave May 
1190d8588912SDave May   PetscFunctionBegin;
1191699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSubMats_C",(Mat,PetscInt*,PetscInt*,Mat***),(A,M,N,mat));CHKERRQ(ierr);
1192d8588912SDave May   PetscFunctionReturn(0);
1193d8588912SDave May }
1194d8588912SDave May 
11957087cfbeSBarry Smith PetscErrorCode  MatNestGetSize_Nest(Mat A,PetscInt *M,PetscInt *N)
1196d8588912SDave May {
1197d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
1198d8588912SDave May 
1199d8588912SDave May   PetscFunctionBegin;
120026fbe8dcSKarl Rupp   if (M) *M = bA->nr;
120126fbe8dcSKarl Rupp   if (N) *N = bA->nc;
1202d8588912SDave May   PetscFunctionReturn(0);
1203d8588912SDave May }
1204d8588912SDave May 
12059ba0d327SJed Brown /*@
1206d8588912SDave May  MatNestGetSize - Returns the size of the nest matrix.
1207d8588912SDave May 
1208d8588912SDave May  Not collective
1209d8588912SDave May 
1210d8588912SDave May  Input Parameters:
1211d8588912SDave May .   A  - nest matrix
1212d8588912SDave May 
1213d8588912SDave May  Output Parameter:
1214629881c0SJed Brown +   M - number of rows in the nested mat
1215629881c0SJed Brown -   N - number of cols in the nested mat
1216d8588912SDave May 
1217d8588912SDave May  Notes:
1218d8588912SDave May 
1219d8588912SDave May  Level: developer
1220d8588912SDave May 
1221bb97c47cSPierre Jolivet .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MATNEST, MatCreateNest(), MatNestGetLocalISs(),
122279798668SBarry Smith           MatNestGetISs()
1223d8588912SDave May @*/
12247087cfbeSBarry Smith PetscErrorCode  MatNestGetSize(Mat A,PetscInt *M,PetscInt *N)
1225d8588912SDave May {
1226699a902aSJed Brown   PetscErrorCode ierr;
1227d8588912SDave May 
1228d8588912SDave May   PetscFunctionBegin;
1229699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSize_C",(Mat,PetscInt*,PetscInt*),(A,M,N));CHKERRQ(ierr);
1230d8588912SDave May   PetscFunctionReturn(0);
1231d8588912SDave May }
1232d8588912SDave May 
1233f7a08781SBarry Smith static PetscErrorCode MatNestGetISs_Nest(Mat A,IS rows[],IS cols[])
1234900e7ff2SJed Brown {
1235900e7ff2SJed Brown   Mat_Nest *vs = (Mat_Nest*)A->data;
1236900e7ff2SJed Brown   PetscInt i;
1237900e7ff2SJed Brown 
1238900e7ff2SJed Brown   PetscFunctionBegin;
1239900e7ff2SJed Brown   if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->isglobal.row[i];
1240900e7ff2SJed Brown   if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->isglobal.col[i];
1241900e7ff2SJed Brown   PetscFunctionReturn(0);
1242900e7ff2SJed Brown }
1243900e7ff2SJed Brown 
12443a4d7b9aSSatish Balay /*@C
1245900e7ff2SJed Brown  MatNestGetISs - Returns the index sets partitioning the row and column spaces
1246900e7ff2SJed Brown 
1247900e7ff2SJed Brown  Not collective
1248900e7ff2SJed Brown 
1249900e7ff2SJed Brown  Input Parameters:
1250900e7ff2SJed Brown .   A  - nest matrix
1251900e7ff2SJed Brown 
1252900e7ff2SJed Brown  Output Parameter:
1253900e7ff2SJed Brown +   rows - array of row index sets
1254900e7ff2SJed Brown -   cols - array of column index sets
1255900e7ff2SJed Brown 
1256900e7ff2SJed Brown  Level: advanced
1257900e7ff2SJed Brown 
1258900e7ff2SJed Brown  Notes:
1259900e7ff2SJed Brown  The user must have allocated arrays of the correct size. The reference count is not increased on the returned ISs.
1260900e7ff2SJed Brown 
126179798668SBarry Smith .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetLocalISs(), MATNEST,
1262bb97c47cSPierre Jolivet           MatCreateNest(), MatNestGetSubMats(), MatNestSetSubMats()
1263900e7ff2SJed Brown @*/
1264900e7ff2SJed Brown PetscErrorCode  MatNestGetISs(Mat A,IS rows[],IS cols[])
1265900e7ff2SJed Brown {
1266900e7ff2SJed Brown   PetscErrorCode ierr;
1267900e7ff2SJed Brown 
1268900e7ff2SJed Brown   PetscFunctionBegin;
1269900e7ff2SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1270900e7ff2SJed Brown   ierr = PetscUseMethod(A,"MatNestGetISs_C",(Mat,IS[],IS[]),(A,rows,cols));CHKERRQ(ierr);
1271900e7ff2SJed Brown   PetscFunctionReturn(0);
1272900e7ff2SJed Brown }
1273900e7ff2SJed Brown 
1274f7a08781SBarry Smith static PetscErrorCode MatNestGetLocalISs_Nest(Mat A,IS rows[],IS cols[])
1275900e7ff2SJed Brown {
1276900e7ff2SJed Brown   Mat_Nest *vs = (Mat_Nest*)A->data;
1277900e7ff2SJed Brown   PetscInt i;
1278900e7ff2SJed Brown 
1279900e7ff2SJed Brown   PetscFunctionBegin;
1280900e7ff2SJed Brown   if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->islocal.row[i];
1281900e7ff2SJed Brown   if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->islocal.col[i];
1282900e7ff2SJed Brown   PetscFunctionReturn(0);
1283900e7ff2SJed Brown }
1284900e7ff2SJed Brown 
1285900e7ff2SJed Brown /*@C
1286900e7ff2SJed Brown  MatNestGetLocalISs - Returns the index sets partitioning the row and column spaces
1287900e7ff2SJed Brown 
1288900e7ff2SJed Brown  Not collective
1289900e7ff2SJed Brown 
1290900e7ff2SJed Brown  Input Parameters:
1291900e7ff2SJed Brown .   A  - nest matrix
1292900e7ff2SJed Brown 
1293900e7ff2SJed Brown  Output Parameter:
12940298fd71SBarry Smith +   rows - array of row index sets (or NULL to ignore)
12950298fd71SBarry Smith -   cols - array of column index sets (or NULL to ignore)
1296900e7ff2SJed Brown 
1297900e7ff2SJed Brown  Level: advanced
1298900e7ff2SJed Brown 
1299900e7ff2SJed Brown  Notes:
1300900e7ff2SJed Brown  The user must have allocated arrays of the correct size. The reference count is not increased on the returned ISs.
1301900e7ff2SJed Brown 
1302bb97c47cSPierre Jolivet .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetISs(), MatCreateNest(),
130379798668SBarry Smith           MATNEST, MatNestSetSubMats(), MatNestSetSubMat()
1304900e7ff2SJed Brown @*/
1305900e7ff2SJed Brown PetscErrorCode  MatNestGetLocalISs(Mat A,IS rows[],IS cols[])
1306900e7ff2SJed Brown {
1307900e7ff2SJed Brown   PetscErrorCode ierr;
1308900e7ff2SJed Brown 
1309900e7ff2SJed Brown   PetscFunctionBegin;
1310900e7ff2SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1311900e7ff2SJed Brown   ierr = PetscUseMethod(A,"MatNestGetLocalISs_C",(Mat,IS[],IS[]),(A,rows,cols));CHKERRQ(ierr);
1312900e7ff2SJed Brown   PetscFunctionReturn(0);
1313900e7ff2SJed Brown }
1314900e7ff2SJed Brown 
131519fd82e9SBarry Smith PetscErrorCode  MatNestSetVecType_Nest(Mat A,VecType vtype)
1316207556f9SJed Brown {
1317207556f9SJed Brown   PetscErrorCode ierr;
1318207556f9SJed Brown   PetscBool      flg;
1319207556f9SJed Brown 
1320207556f9SJed Brown   PetscFunctionBegin;
1321207556f9SJed Brown   ierr = PetscStrcmp(vtype,VECNEST,&flg);CHKERRQ(ierr);
1322207556f9SJed Brown   /* In reality, this only distinguishes VECNEST and "other" */
13232a7a6963SBarry Smith   if (flg) A->ops->getvecs = MatCreateVecs_Nest;
132412b53f24SSatish Balay   else A->ops->getvecs = (PetscErrorCode (*)(Mat,Vec*,Vec*)) 0;
1325207556f9SJed Brown   PetscFunctionReturn(0);
1326207556f9SJed Brown }
1327207556f9SJed Brown 
1328207556f9SJed Brown /*@C
13292a7a6963SBarry Smith  MatNestSetVecType - Sets the type of Vec returned by MatCreateVecs()
1330207556f9SJed Brown 
1331207556f9SJed Brown  Not collective
1332207556f9SJed Brown 
1333207556f9SJed Brown  Input Parameters:
1334207556f9SJed Brown +  A  - nest matrix
1335207556f9SJed Brown -  vtype - type to use for creating vectors
1336207556f9SJed Brown 
1337207556f9SJed Brown  Notes:
1338207556f9SJed Brown 
1339207556f9SJed Brown  Level: developer
1340207556f9SJed Brown 
1341bb97c47cSPierre Jolivet .seealso: MatCreateVecs(), MATNEST, MatCreateNest()
1342207556f9SJed Brown @*/
134319fd82e9SBarry Smith PetscErrorCode  MatNestSetVecType(Mat A,VecType vtype)
1344207556f9SJed Brown {
1345207556f9SJed Brown   PetscErrorCode ierr;
1346207556f9SJed Brown 
1347207556f9SJed Brown   PetscFunctionBegin;
134819fd82e9SBarry Smith   ierr = PetscTryMethod(A,"MatNestSetVecType_C",(Mat,VecType),(A,vtype));CHKERRQ(ierr);
1349207556f9SJed Brown   PetscFunctionReturn(0);
1350207556f9SJed Brown }
1351207556f9SJed Brown 
1352c8883902SJed Brown PetscErrorCode MatNestSetSubMats_Nest(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[])
1353d8588912SDave May {
1354c8883902SJed Brown   Mat_Nest       *s = (Mat_Nest*)A->data;
1355c8883902SJed Brown   PetscInt       i,j,m,n,M,N;
1356d8588912SDave May   PetscErrorCode ierr;
135706a1af2fSStefano Zampini   PetscBool      cong;
1358d8588912SDave May 
1359d8588912SDave May   PetscFunctionBegin;
136006a1af2fSStefano Zampini   ierr = MatReset_Nest(A);CHKERRQ(ierr);
136106a1af2fSStefano Zampini 
1362c8883902SJed Brown   s->nr = nr;
1363c8883902SJed Brown   s->nc = nc;
1364d8588912SDave May 
1365c8883902SJed Brown   /* Create space for submatrices */
1366854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&s->m);CHKERRQ(ierr);
1367c8883902SJed Brown   for (i=0; i<nr; i++) {
1368854ce69bSBarry Smith     ierr = PetscMalloc1(nc,&s->m[i]);CHKERRQ(ierr);
1369d8588912SDave May   }
1370c8883902SJed Brown   for (i=0; i<nr; i++) {
1371c8883902SJed Brown     for (j=0; j<nc; j++) {
1372c8883902SJed Brown       s->m[i][j] = a[i*nc+j];
1373c8883902SJed Brown       if (a[i*nc+j]) {
1374c8883902SJed Brown         ierr = PetscObjectReference((PetscObject)a[i*nc+j]);CHKERRQ(ierr);
1375d8588912SDave May       }
1376d8588912SDave May     }
1377d8588912SDave May   }
1378d8588912SDave May 
13798188e55aSJed Brown   ierr = MatSetUp_NestIS_Private(A,nr,is_row,nc,is_col);CHKERRQ(ierr);
1380d8588912SDave May 
1381854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&s->row_len);CHKERRQ(ierr);
1382854ce69bSBarry Smith   ierr = PetscMalloc1(nc,&s->col_len);CHKERRQ(ierr);
1383c8883902SJed Brown   for (i=0; i<nr; i++) s->row_len[i]=-1;
1384c8883902SJed Brown   for (j=0; j<nc; j++) s->col_len[j]=-1;
1385d8588912SDave May 
138606a1af2fSStefano Zampini   ierr = PetscCalloc1(nr*nc,&s->nnzstate);CHKERRQ(ierr);
138706a1af2fSStefano Zampini   for (i=0; i<nr; i++) {
138806a1af2fSStefano Zampini     for (j=0; j<nc; j++) {
138906a1af2fSStefano Zampini       if (s->m[i][j]) {
139006a1af2fSStefano Zampini         ierr = MatGetNonzeroState(s->m[i][j],&s->nnzstate[i*nc+j]);CHKERRQ(ierr);
139106a1af2fSStefano Zampini       }
139206a1af2fSStefano Zampini     }
139306a1af2fSStefano Zampini   }
139406a1af2fSStefano Zampini 
13958188e55aSJed Brown   ierr = MatNestGetSizes_Private(A,&m,&n,&M,&N);CHKERRQ(ierr);
1396d8588912SDave May 
1397c8883902SJed Brown   ierr = PetscLayoutSetSize(A->rmap,M);CHKERRQ(ierr);
1398c8883902SJed Brown   ierr = PetscLayoutSetLocalSize(A->rmap,m);CHKERRQ(ierr);
1399c8883902SJed Brown   ierr = PetscLayoutSetSize(A->cmap,N);CHKERRQ(ierr);
1400c8883902SJed Brown   ierr = PetscLayoutSetLocalSize(A->cmap,n);CHKERRQ(ierr);
1401c8883902SJed Brown 
1402c8883902SJed Brown   ierr = PetscLayoutSetUp(A->rmap);CHKERRQ(ierr);
1403c8883902SJed Brown   ierr = PetscLayoutSetUp(A->cmap);CHKERRQ(ierr);
1404c8883902SJed Brown 
140506a1af2fSStefano Zampini   /* disable operations that are not supported for non-square matrices,
140606a1af2fSStefano Zampini      or matrices for which is_row != is_col  */
140706a1af2fSStefano Zampini   ierr = MatHasCongruentLayouts(A,&cong);CHKERRQ(ierr);
140806a1af2fSStefano Zampini   if (cong && nr != nc) cong = PETSC_FALSE;
140906a1af2fSStefano Zampini   if (cong) {
141006a1af2fSStefano Zampini     for (i = 0; cong && i < nr; i++) {
1411320466b0SStefano Zampini       ierr = ISEqualUnsorted(s->isglobal.row[i],s->isglobal.col[i],&cong);CHKERRQ(ierr);
141206a1af2fSStefano Zampini     }
141306a1af2fSStefano Zampini   }
141406a1af2fSStefano Zampini   if (!cong) {
1415381b8e50SStefano Zampini     A->ops->missingdiagonal = NULL;
141606a1af2fSStefano Zampini     A->ops->getdiagonal     = NULL;
141706a1af2fSStefano Zampini     A->ops->shift           = NULL;
141806a1af2fSStefano Zampini     A->ops->diagonalset     = NULL;
141906a1af2fSStefano Zampini   }
142006a1af2fSStefano Zampini 
14211795a4d1SJed Brown   ierr = PetscCalloc2(nr,&s->left,nc,&s->right);CHKERRQ(ierr);
142206a1af2fSStefano Zampini   ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr);
142306a1af2fSStefano Zampini   A->nonzerostate++;
1424d8588912SDave May   PetscFunctionReturn(0);
1425d8588912SDave May }
1426d8588912SDave May 
1427c8883902SJed Brown /*@
1428c8883902SJed Brown    MatNestSetSubMats - Sets the nested submatrices
1429c8883902SJed Brown 
1430c8883902SJed Brown    Collective on Mat
1431c8883902SJed Brown 
1432c8883902SJed Brown    Input Parameter:
1433ffd6319bSRichard Tran Mills +  A - nested matrix
1434c8883902SJed Brown .  nr - number of nested row blocks
14350298fd71SBarry Smith .  is_row - index sets for each nested row block, or NULL to make contiguous
1436c8883902SJed Brown .  nc - number of nested column blocks
14370298fd71SBarry Smith .  is_col - index sets for each nested column block, or NULL to make contiguous
14380298fd71SBarry Smith -  a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL
1439c8883902SJed Brown 
144006a1af2fSStefano Zampini    Notes: this always resets any submatrix information previously set
144106a1af2fSStefano Zampini 
1442c8883902SJed Brown    Level: advanced
1443c8883902SJed Brown 
144479798668SBarry Smith .seealso: MatCreateNest(), MATNEST, MatNestSetSubMat(), MatNestGetSubMat(), MatNestGetSubMats()
1445c8883902SJed Brown @*/
1446c8883902SJed Brown PetscErrorCode MatNestSetSubMats(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[])
1447c8883902SJed Brown {
1448c8883902SJed Brown   PetscErrorCode ierr;
144906a1af2fSStefano Zampini   PetscInt       i;
1450c8883902SJed Brown 
1451c8883902SJed Brown   PetscFunctionBegin;
1452c8883902SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1453ce94432eSBarry Smith   if (nr < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of rows cannot be negative");
1454c8883902SJed Brown   if (nr && is_row) {
1455c8883902SJed Brown     PetscValidPointer(is_row,3);
1456c8883902SJed Brown     for (i=0; i<nr; i++) PetscValidHeaderSpecific(is_row[i],IS_CLASSID,3);
1457c8883902SJed Brown   }
1458ce94432eSBarry Smith   if (nc < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of columns cannot be negative");
14591664e352SJed Brown   if (nc && is_col) {
1460c8883902SJed Brown     PetscValidPointer(is_col,5);
14619b30a8f6SBarry Smith     for (i=0; i<nc; i++) PetscValidHeaderSpecific(is_col[i],IS_CLASSID,5);
1462c8883902SJed Brown   }
146306a1af2fSStefano Zampini   if (nr*nc > 0) PetscValidPointer(a,6);
1464c8883902SJed Brown   ierr = PetscUseMethod(A,"MatNestSetSubMats_C",(Mat,PetscInt,const IS[],PetscInt,const IS[],const Mat[]),(A,nr,is_row,nc,is_col,a));CHKERRQ(ierr);
1465c8883902SJed Brown   PetscFunctionReturn(0);
1466c8883902SJed Brown }
1467d8588912SDave May 
146845b6f7e9SBarry Smith static PetscErrorCode MatNestCreateAggregateL2G_Private(Mat A,PetscInt n,const IS islocal[],const IS isglobal[],PetscBool colflg,ISLocalToGlobalMapping *ltog)
146977019fcaSJed Brown {
147077019fcaSJed Brown   PetscErrorCode ierr;
147177019fcaSJed Brown   PetscBool      flg;
147277019fcaSJed Brown   PetscInt       i,j,m,mi,*ix;
147377019fcaSJed Brown 
147477019fcaSJed Brown   PetscFunctionBegin;
1475aea6d515SStefano Zampini   *ltog = NULL;
147677019fcaSJed Brown   for (i=0,m=0,flg=PETSC_FALSE; i<n; i++) {
147777019fcaSJed Brown     if (islocal[i]) {
1478aea6d515SStefano Zampini       ierr = ISGetLocalSize(islocal[i],&mi);CHKERRQ(ierr);
147977019fcaSJed Brown       flg  = PETSC_TRUE;      /* We found a non-trivial entry */
148077019fcaSJed Brown     } else {
1481aea6d515SStefano Zampini       ierr = ISGetLocalSize(isglobal[i],&mi);CHKERRQ(ierr);
148277019fcaSJed Brown     }
148377019fcaSJed Brown     m += mi;
148477019fcaSJed Brown   }
1485aea6d515SStefano Zampini   if (!flg) PetscFunctionReturn(0);
1486aea6d515SStefano Zampini 
1487785e854fSJed Brown   ierr = PetscMalloc1(m,&ix);CHKERRQ(ierr);
1488165cd838SBarry Smith   for (i=0,m=0; i<n; i++) {
14890298fd71SBarry Smith     ISLocalToGlobalMapping smap = NULL;
1490e108cb99SStefano Zampini     Mat                    sub = NULL;
1491f6d38dbbSStefano Zampini     PetscSF                sf;
1492f6d38dbbSStefano Zampini     PetscLayout            map;
1493aea6d515SStefano Zampini     const PetscInt         *ix2;
149477019fcaSJed Brown 
1495165cd838SBarry Smith     if (!colflg) {
149677019fcaSJed Brown       ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
149777019fcaSJed Brown     } else {
149877019fcaSJed Brown       ierr = MatNestFindNonzeroSubMatCol(A,i,&sub);CHKERRQ(ierr);
149977019fcaSJed Brown     }
1500191fd14bSBarry Smith     if (sub) {
1501191fd14bSBarry Smith       if (!colflg) {
1502191fd14bSBarry Smith         ierr = MatGetLocalToGlobalMapping(sub,&smap,NULL);CHKERRQ(ierr);
1503191fd14bSBarry Smith       } else {
1504191fd14bSBarry Smith         ierr = MatGetLocalToGlobalMapping(sub,NULL,&smap);CHKERRQ(ierr);
1505191fd14bSBarry Smith       }
1506191fd14bSBarry Smith     }
150777019fcaSJed Brown     /*
150877019fcaSJed Brown        Now we need to extract the monolithic global indices that correspond to the given split global indices.
150977019fcaSJed Brown        In many/most cases, we only want MatGetLocalSubMatrix() to work, in which case we only need to know the size of the local spaces.
151077019fcaSJed Brown     */
1511aea6d515SStefano Zampini     ierr = ISGetIndices(isglobal[i],&ix2);CHKERRQ(ierr);
1512aea6d515SStefano Zampini     if (islocal[i]) {
1513aea6d515SStefano Zampini       PetscInt *ilocal,*iremote;
1514aea6d515SStefano Zampini       PetscInt mil,nleaves;
1515aea6d515SStefano Zampini 
1516aea6d515SStefano Zampini       ierr = ISGetLocalSize(islocal[i],&mi);CHKERRQ(ierr);
1517aea6d515SStefano Zampini       if (!smap) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"Missing local to global map");
1518aea6d515SStefano Zampini       for (j=0; j<mi; j++) ix[m+j] = j;
1519aea6d515SStefano Zampini       ierr = ISLocalToGlobalMappingApply(smap,mi,ix+m,ix+m);CHKERRQ(ierr);
1520aea6d515SStefano Zampini 
1521aea6d515SStefano Zampini       /* PetscSFSetGraphLayout does not like negative indices */
1522aea6d515SStefano Zampini       ierr = PetscMalloc2(mi,&ilocal,mi,&iremote);CHKERRQ(ierr);
1523aea6d515SStefano Zampini       for (j=0, nleaves = 0; j<mi; j++) {
1524aea6d515SStefano Zampini         if (ix[m+j] < 0) continue;
1525aea6d515SStefano Zampini         ilocal[nleaves]  = j;
1526aea6d515SStefano Zampini         iremote[nleaves] = ix[m+j];
1527aea6d515SStefano Zampini         nleaves++;
1528aea6d515SStefano Zampini       }
1529aea6d515SStefano Zampini       ierr = ISGetLocalSize(isglobal[i],&mil);CHKERRQ(ierr);
1530aea6d515SStefano Zampini       ierr = PetscSFCreate(PetscObjectComm((PetscObject)A),&sf);CHKERRQ(ierr);
1531aea6d515SStefano Zampini       ierr = PetscLayoutCreate(PetscObjectComm((PetscObject)A),&map);CHKERRQ(ierr);
1532aea6d515SStefano Zampini       ierr = PetscLayoutSetLocalSize(map,mil);CHKERRQ(ierr);
1533f6d38dbbSStefano Zampini       ierr = PetscLayoutSetUp(map);CHKERRQ(ierr);
1534aea6d515SStefano Zampini       ierr = PetscSFSetGraphLayout(sf,map,nleaves,ilocal,PETSC_USE_POINTER,iremote);CHKERRQ(ierr);
1535f6d38dbbSStefano Zampini       ierr = PetscLayoutDestroy(&map);CHKERRQ(ierr);
1536*ad227feaSJunchao Zhang       ierr = PetscSFBcastBegin(sf,MPIU_INT,ix2,ix + m,MPI_REPLACE);CHKERRQ(ierr);
1537*ad227feaSJunchao Zhang       ierr = PetscSFBcastEnd(sf,MPIU_INT,ix2,ix + m,MPI_REPLACE);CHKERRQ(ierr);
1538f6d38dbbSStefano Zampini       ierr = PetscSFDestroy(&sf);CHKERRQ(ierr);
1539aea6d515SStefano Zampini       ierr = PetscFree2(ilocal,iremote);CHKERRQ(ierr);
1540aea6d515SStefano Zampini     } else {
1541aea6d515SStefano Zampini       ierr = ISGetLocalSize(isglobal[i],&mi);CHKERRQ(ierr);
1542aea6d515SStefano Zampini       for (j=0; j<mi; j++) ix[m+j] = ix2[i];
1543aea6d515SStefano Zampini     }
1544aea6d515SStefano Zampini     ierr = ISRestoreIndices(isglobal[i],&ix2);CHKERRQ(ierr);
154577019fcaSJed Brown     m   += mi;
154677019fcaSJed Brown   }
1547f0413b6fSBarry Smith   ierr = ISLocalToGlobalMappingCreate(PetscObjectComm((PetscObject)A),1,m,ix,PETSC_OWN_POINTER,ltog);CHKERRQ(ierr);
154877019fcaSJed Brown   PetscFunctionReturn(0);
154977019fcaSJed Brown }
155077019fcaSJed Brown 
155177019fcaSJed Brown 
1552d8588912SDave May /* If an IS was provided, there is nothing Nest needs to do, otherwise Nest will build a strided IS */
1553d8588912SDave May /*
1554d8588912SDave May   nprocessors = NP
1555d8588912SDave May   Nest x^T = ((g_0,g_1,...g_nprocs-1), (h_0,h_1,...h_NP-1))
1556d8588912SDave May        proc 0: => (g_0,h_0,)
1557d8588912SDave May        proc 1: => (g_1,h_1,)
1558d8588912SDave May        ...
1559d8588912SDave May        proc nprocs-1: => (g_NP-1,h_NP-1,)
1560d8588912SDave May 
1561d8588912SDave May             proc 0:                      proc 1:                    proc nprocs-1:
1562d8588912SDave May     is[0] = (0,1,2,...,nlocal(g_0)-1)  (0,1,...,nlocal(g_1)-1)  (0,1,...,nlocal(g_NP-1))
1563d8588912SDave May 
1564d8588912SDave May             proc 0:
1565d8588912SDave May     is[1] = (nlocal(g_0),nlocal(g_0)+1,...,nlocal(g_0)+nlocal(h_0)-1)
1566d8588912SDave May             proc 1:
1567d8588912SDave May     is[1] = (nlocal(g_1),nlocal(g_1)+1,...,nlocal(g_1)+nlocal(h_1)-1)
1568d8588912SDave May 
1569d8588912SDave May             proc NP-1:
1570d8588912SDave May     is[1] = (nlocal(g_NP-1),nlocal(g_NP-1)+1,...,nlocal(g_NP-1)+nlocal(h_NP-1)-1)
1571d8588912SDave May */
1572841e96a3SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[])
1573d8588912SDave May {
1574e2d7f03fSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
15758188e55aSJed Brown   PetscInt       i,j,offset,n,nsum,bs;
1576d8588912SDave May   PetscErrorCode ierr;
15770298fd71SBarry Smith   Mat            sub = NULL;
1578d8588912SDave May 
1579d8588912SDave May   PetscFunctionBegin;
1580854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&vs->isglobal.row);CHKERRQ(ierr);
1581854ce69bSBarry Smith   ierr = PetscMalloc1(nc,&vs->isglobal.col);CHKERRQ(ierr);
1582d8588912SDave May   if (is_row) { /* valid IS is passed in */
1583d8588912SDave May     /* refs on is[] are incremeneted */
1584e2d7f03fSJed Brown     for (i=0; i<vs->nr; i++) {
1585d8588912SDave May       ierr = PetscObjectReference((PetscObject)is_row[i]);CHKERRQ(ierr);
158626fbe8dcSKarl Rupp 
1587e2d7f03fSJed Brown       vs->isglobal.row[i] = is_row[i];
1588d8588912SDave May     }
15892ae74bdbSJed Brown   } else {                      /* Create the ISs by inspecting sizes of a submatrix in each row */
15908188e55aSJed Brown     nsum = 0;
15918188e55aSJed Brown     for (i=0; i<vs->nr; i++) {  /* Add up the local sizes to compute the aggregate offset */
15928188e55aSJed Brown       ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
1593ce94432eSBarry Smith       if (!sub) SETERRQ1(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in row %D",i);
15940298fd71SBarry Smith       ierr = MatGetLocalSize(sub,&n,NULL);CHKERRQ(ierr);
1595ce94432eSBarry Smith       if (n < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix");
15968188e55aSJed Brown       nsum += n;
15978188e55aSJed Brown     }
159855b25c41SPierre Jolivet     ierr    = MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A));CHKERRMPI(ierr);
159930bc264bSJed Brown     offset -= nsum;
1600e2d7f03fSJed Brown     for (i=0; i<vs->nr; i++) {
1601f349c1fdSJed Brown       ierr    = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
16020298fd71SBarry Smith       ierr    = MatGetLocalSize(sub,&n,NULL);CHKERRQ(ierr);
160373b6653fSLawrence Mitchell       ierr    = MatGetBlockSizes(sub,&bs,NULL);CHKERRQ(ierr);
1604ce94432eSBarry Smith       ierr    = ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.row[i]);CHKERRQ(ierr);
1605e2d7f03fSJed Brown       ierr    = ISSetBlockSize(vs->isglobal.row[i],bs);CHKERRQ(ierr);
16062ae74bdbSJed Brown       offset += n;
1607d8588912SDave May     }
1608d8588912SDave May   }
1609d8588912SDave May 
1610d8588912SDave May   if (is_col) { /* valid IS is passed in */
1611d8588912SDave May     /* refs on is[] are incremeneted */
1612e2d7f03fSJed Brown     for (j=0; j<vs->nc; j++) {
1613d8588912SDave May       ierr = PetscObjectReference((PetscObject)is_col[j]);CHKERRQ(ierr);
161426fbe8dcSKarl Rupp 
1615e2d7f03fSJed Brown       vs->isglobal.col[j] = is_col[j];
1616d8588912SDave May     }
16172ae74bdbSJed Brown   } else {                      /* Create the ISs by inspecting sizes of a submatrix in each column */
16182ae74bdbSJed Brown     offset = A->cmap->rstart;
16198188e55aSJed Brown     nsum   = 0;
16208188e55aSJed Brown     for (j=0; j<vs->nc; j++) {
16218188e55aSJed Brown       ierr = MatNestFindNonzeroSubMatCol(A,j,&sub);CHKERRQ(ierr);
1622ce94432eSBarry Smith       if (!sub) SETERRQ1(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in column %D",i);
16230298fd71SBarry Smith       ierr = MatGetLocalSize(sub,NULL,&n);CHKERRQ(ierr);
1624ce94432eSBarry Smith       if (n < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix");
16258188e55aSJed Brown       nsum += n;
16268188e55aSJed Brown     }
162755b25c41SPierre Jolivet     ierr    = MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A));CHKERRMPI(ierr);
162830bc264bSJed Brown     offset -= nsum;
1629e2d7f03fSJed Brown     for (j=0; j<vs->nc; j++) {
1630f349c1fdSJed Brown       ierr    = MatNestFindNonzeroSubMatCol(A,j,&sub);CHKERRQ(ierr);
16310298fd71SBarry Smith       ierr    = MatGetLocalSize(sub,NULL,&n);CHKERRQ(ierr);
163273b6653fSLawrence Mitchell       ierr    = MatGetBlockSizes(sub,NULL,&bs);CHKERRQ(ierr);
1633ce94432eSBarry Smith       ierr    = ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.col[j]);CHKERRQ(ierr);
1634e2d7f03fSJed Brown       ierr    = ISSetBlockSize(vs->isglobal.col[j],bs);CHKERRQ(ierr);
16352ae74bdbSJed Brown       offset += n;
1636d8588912SDave May     }
1637d8588912SDave May   }
1638e2d7f03fSJed Brown 
1639e2d7f03fSJed Brown   /* Set up the local ISs */
1640785e854fSJed Brown   ierr = PetscMalloc1(vs->nr,&vs->islocal.row);CHKERRQ(ierr);
1641785e854fSJed Brown   ierr = PetscMalloc1(vs->nc,&vs->islocal.col);CHKERRQ(ierr);
1642e2d7f03fSJed Brown   for (i=0,offset=0; i<vs->nr; i++) {
1643e2d7f03fSJed Brown     IS                     isloc;
16440298fd71SBarry Smith     ISLocalToGlobalMapping rmap = NULL;
1645e2d7f03fSJed Brown     PetscInt               nlocal,bs;
1646e2d7f03fSJed Brown     ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
16470298fd71SBarry Smith     if (sub) {ierr = MatGetLocalToGlobalMapping(sub,&rmap,NULL);CHKERRQ(ierr);}
1648207556f9SJed Brown     if (rmap) {
164973b6653fSLawrence Mitchell       ierr = MatGetBlockSizes(sub,&bs,NULL);CHKERRQ(ierr);
1650e2d7f03fSJed Brown       ierr = ISLocalToGlobalMappingGetSize(rmap,&nlocal);CHKERRQ(ierr);
1651e2d7f03fSJed Brown       ierr = ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc);CHKERRQ(ierr);
1652e2d7f03fSJed Brown       ierr = ISSetBlockSize(isloc,bs);CHKERRQ(ierr);
1653207556f9SJed Brown     } else {
1654207556f9SJed Brown       nlocal = 0;
16550298fd71SBarry Smith       isloc  = NULL;
1656207556f9SJed Brown     }
1657e2d7f03fSJed Brown     vs->islocal.row[i] = isloc;
1658e2d7f03fSJed Brown     offset            += nlocal;
1659e2d7f03fSJed Brown   }
16608188e55aSJed Brown   for (i=0,offset=0; i<vs->nc; i++) {
1661e2d7f03fSJed Brown     IS                     isloc;
16620298fd71SBarry Smith     ISLocalToGlobalMapping cmap = NULL;
1663e2d7f03fSJed Brown     PetscInt               nlocal,bs;
1664e2d7f03fSJed Brown     ierr = MatNestFindNonzeroSubMatCol(A,i,&sub);CHKERRQ(ierr);
16650298fd71SBarry Smith     if (sub) {ierr = MatGetLocalToGlobalMapping(sub,NULL,&cmap);CHKERRQ(ierr);}
1666207556f9SJed Brown     if (cmap) {
166773b6653fSLawrence Mitchell       ierr = MatGetBlockSizes(sub,NULL,&bs);CHKERRQ(ierr);
1668e2d7f03fSJed Brown       ierr = ISLocalToGlobalMappingGetSize(cmap,&nlocal);CHKERRQ(ierr);
1669e2d7f03fSJed Brown       ierr = ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc);CHKERRQ(ierr);
1670e2d7f03fSJed Brown       ierr = ISSetBlockSize(isloc,bs);CHKERRQ(ierr);
1671207556f9SJed Brown     } else {
1672207556f9SJed Brown       nlocal = 0;
16730298fd71SBarry Smith       isloc  = NULL;
1674207556f9SJed Brown     }
1675e2d7f03fSJed Brown     vs->islocal.col[i] = isloc;
1676e2d7f03fSJed Brown     offset            += nlocal;
1677e2d7f03fSJed Brown   }
16780189643fSJed Brown 
167977019fcaSJed Brown   /* Set up the aggregate ISLocalToGlobalMapping */
168077019fcaSJed Brown   {
168145b6f7e9SBarry Smith     ISLocalToGlobalMapping rmap,cmap;
168245b6f7e9SBarry Smith     ierr = MatNestCreateAggregateL2G_Private(A,vs->nr,vs->islocal.row,vs->isglobal.row,PETSC_FALSE,&rmap);CHKERRQ(ierr);
168345b6f7e9SBarry Smith     ierr = MatNestCreateAggregateL2G_Private(A,vs->nc,vs->islocal.col,vs->isglobal.col,PETSC_TRUE,&cmap);CHKERRQ(ierr);
168477019fcaSJed Brown     if (rmap && cmap) {ierr = MatSetLocalToGlobalMapping(A,rmap,cmap);CHKERRQ(ierr);}
168577019fcaSJed Brown     ierr = ISLocalToGlobalMappingDestroy(&rmap);CHKERRQ(ierr);
168677019fcaSJed Brown     ierr = ISLocalToGlobalMappingDestroy(&cmap);CHKERRQ(ierr);
168777019fcaSJed Brown   }
168877019fcaSJed Brown 
168976bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
16900189643fSJed Brown     for (i=0; i<vs->nr; i++) {
16910189643fSJed Brown       for (j=0; j<vs->nc; j++) {
16920189643fSJed Brown         PetscInt m,n,M,N,mi,ni,Mi,Ni;
16930189643fSJed Brown         Mat      B = vs->m[i][j];
16940189643fSJed Brown         if (!B) continue;
16950189643fSJed Brown         ierr = MatGetSize(B,&M,&N);CHKERRQ(ierr);
16960189643fSJed Brown         ierr = MatGetLocalSize(B,&m,&n);CHKERRQ(ierr);
16970189643fSJed Brown         ierr = ISGetSize(vs->isglobal.row[i],&Mi);CHKERRQ(ierr);
16980189643fSJed Brown         ierr = ISGetSize(vs->isglobal.col[j],&Ni);CHKERRQ(ierr);
16990189643fSJed Brown         ierr = ISGetLocalSize(vs->isglobal.row[i],&mi);CHKERRQ(ierr);
17000189643fSJed Brown         ierr = ISGetLocalSize(vs->isglobal.col[j],&ni);CHKERRQ(ierr);
1701ce94432eSBarry Smith         if (M != Mi || N != Ni) SETERRQ6(PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Global sizes (%D,%D) of nested submatrix (%D,%D) do not agree with space defined by index sets (%D,%D)",M,N,i,j,Mi,Ni);
1702ce94432eSBarry Smith         if (m != mi || n != ni) SETERRQ6(PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Local sizes (%D,%D) of nested submatrix (%D,%D) do not agree with space defined by index sets (%D,%D)",m,n,i,j,mi,ni);
17030189643fSJed Brown       }
17040189643fSJed Brown     }
170576bd3646SJed Brown   }
1706a061e289SJed Brown 
1707a061e289SJed Brown   /* Set A->assembled if all non-null blocks are currently assembled */
1708a061e289SJed Brown   for (i=0; i<vs->nr; i++) {
1709a061e289SJed Brown     for (j=0; j<vs->nc; j++) {
1710a061e289SJed Brown       if (vs->m[i][j] && !vs->m[i][j]->assembled) PetscFunctionReturn(0);
1711a061e289SJed Brown     }
1712a061e289SJed Brown   }
1713a061e289SJed Brown   A->assembled = PETSC_TRUE;
1714d8588912SDave May   PetscFunctionReturn(0);
1715d8588912SDave May }
1716d8588912SDave May 
171745c38901SJed Brown /*@C
1718659c6bb0SJed Brown    MatCreateNest - Creates a new matrix containing several nested submatrices, each stored separately
1719659c6bb0SJed Brown 
1720659c6bb0SJed Brown    Collective on Mat
1721659c6bb0SJed Brown 
1722659c6bb0SJed Brown    Input Parameter:
1723659c6bb0SJed Brown +  comm - Communicator for the new Mat
1724659c6bb0SJed Brown .  nr - number of nested row blocks
17250298fd71SBarry Smith .  is_row - index sets for each nested row block, or NULL to make contiguous
1726659c6bb0SJed Brown .  nc - number of nested column blocks
17270298fd71SBarry Smith .  is_col - index sets for each nested column block, or NULL to make contiguous
17280298fd71SBarry Smith -  a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL
1729659c6bb0SJed Brown 
1730659c6bb0SJed Brown    Output Parameter:
1731659c6bb0SJed Brown .  B - new matrix
1732659c6bb0SJed Brown 
1733659c6bb0SJed Brown    Level: advanced
1734659c6bb0SJed Brown 
173579798668SBarry Smith .seealso: MatCreate(), VecCreateNest(), DMCreateMatrix(), MATNEST, MatNestSetSubMat(),
173679798668SBarry Smith           MatNestGetSubMat(), MatNestGetLocalISs(), MatNestGetSize(),
173779798668SBarry Smith           MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats()
1738659c6bb0SJed Brown @*/
17397087cfbeSBarry Smith PetscErrorCode MatCreateNest(MPI_Comm comm,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[],Mat *B)
1740d8588912SDave May {
1741d8588912SDave May   Mat            A;
1742d8588912SDave May   PetscErrorCode ierr;
1743d8588912SDave May 
1744d8588912SDave May   PetscFunctionBegin;
1745f4259b30SLisandro Dalcin   *B   = NULL;
1746d8588912SDave May   ierr = MatCreate(comm,&A);CHKERRQ(ierr);
1747c8883902SJed Brown   ierr = MatSetType(A,MATNEST);CHKERRQ(ierr);
174891a28eb3SBarry Smith   A->preallocated = PETSC_TRUE;
1749c8883902SJed Brown   ierr = MatNestSetSubMats(A,nr,is_row,nc,is_col,a);CHKERRQ(ierr);
1750d8588912SDave May   *B   = A;
1751d8588912SDave May   PetscFunctionReturn(0);
1752d8588912SDave May }
1753659c6bb0SJed Brown 
1754b68353e5Sstefano_zampini static PetscErrorCode MatConvert_Nest_SeqAIJ_fast(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
1755b68353e5Sstefano_zampini {
1756b68353e5Sstefano_zampini   Mat_Nest       *nest = (Mat_Nest*)A->data;
175723875855Sstefano_zampini   Mat            *trans;
1758b68353e5Sstefano_zampini   PetscScalar    **avv;
1759b68353e5Sstefano_zampini   PetscScalar    *vv;
1760b68353e5Sstefano_zampini   PetscInt       **aii,**ajj;
1761b68353e5Sstefano_zampini   PetscInt       *ii,*jj,*ci;
1762b68353e5Sstefano_zampini   PetscInt       nr,nc,nnz,i,j;
1763b68353e5Sstefano_zampini   PetscBool      done;
1764b68353e5Sstefano_zampini   PetscErrorCode ierr;
1765b68353e5Sstefano_zampini 
1766b68353e5Sstefano_zampini   PetscFunctionBegin;
1767b68353e5Sstefano_zampini   ierr = MatGetSize(A,&nr,&nc);CHKERRQ(ierr);
1768b68353e5Sstefano_zampini   if (reuse == MAT_REUSE_MATRIX) {
1769b68353e5Sstefano_zampini     PetscInt rnr;
1770b68353e5Sstefano_zampini 
1771b68353e5Sstefano_zampini     ierr = MatGetRowIJ(*newmat,0,PETSC_FALSE,PETSC_FALSE,&rnr,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr);
1772b68353e5Sstefano_zampini     if (!done) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"MatGetRowIJ");
1773b68353e5Sstefano_zampini     if (rnr != nr) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of rows");
1774b68353e5Sstefano_zampini     ierr = MatSeqAIJGetArray(*newmat,&vv);CHKERRQ(ierr);
1775b68353e5Sstefano_zampini   }
1776b68353e5Sstefano_zampini   /* extract CSR for nested SeqAIJ matrices */
1777b68353e5Sstefano_zampini   nnz  = 0;
177823875855Sstefano_zampini   ierr = PetscCalloc4(nest->nr*nest->nc,&aii,nest->nr*nest->nc,&ajj,nest->nr*nest->nc,&avv,nest->nr*nest->nc,&trans);CHKERRQ(ierr);
1779b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1780b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1781b68353e5Sstefano_zampini       Mat B = nest->m[i][j];
1782b68353e5Sstefano_zampini       if (B) {
1783b68353e5Sstefano_zampini         PetscScalar *naa;
1784b68353e5Sstefano_zampini         PetscInt    *nii,*njj,nnr;
178523875855Sstefano_zampini         PetscBool   istrans;
1786b68353e5Sstefano_zampini 
178723875855Sstefano_zampini         ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans);CHKERRQ(ierr);
178823875855Sstefano_zampini         if (istrans) {
178923875855Sstefano_zampini           Mat Bt;
179023875855Sstefano_zampini 
179123875855Sstefano_zampini           ierr = MatTransposeGetMat(B,&Bt);CHKERRQ(ierr);
179223875855Sstefano_zampini           ierr = MatTranspose(Bt,MAT_INITIAL_MATRIX,&trans[i*nest->nc+j]);CHKERRQ(ierr);
179323875855Sstefano_zampini           B    = trans[i*nest->nc+j];
179423875855Sstefano_zampini         }
1795b68353e5Sstefano_zampini         ierr = MatGetRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&nii,(const PetscInt**)&njj,&done);CHKERRQ(ierr);
1796b68353e5Sstefano_zampini         if (!done) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatGetRowIJ");
1797b68353e5Sstefano_zampini         ierr = MatSeqAIJGetArray(B,&naa);CHKERRQ(ierr);
1798b68353e5Sstefano_zampini         nnz += nii[nnr];
1799b68353e5Sstefano_zampini 
1800b68353e5Sstefano_zampini         aii[i*nest->nc+j] = nii;
1801b68353e5Sstefano_zampini         ajj[i*nest->nc+j] = njj;
1802b68353e5Sstefano_zampini         avv[i*nest->nc+j] = naa;
1803b68353e5Sstefano_zampini       }
1804b68353e5Sstefano_zampini     }
1805b68353e5Sstefano_zampini   }
1806b68353e5Sstefano_zampini   if (reuse != MAT_REUSE_MATRIX) {
1807b68353e5Sstefano_zampini     ierr = PetscMalloc1(nr+1,&ii);CHKERRQ(ierr);
1808b68353e5Sstefano_zampini     ierr = PetscMalloc1(nnz,&jj);CHKERRQ(ierr);
1809b68353e5Sstefano_zampini     ierr = PetscMalloc1(nnz,&vv);CHKERRQ(ierr);
1810b68353e5Sstefano_zampini   } else {
1811b68353e5Sstefano_zampini     if (nnz != ii[nr]) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of nonzeros");
1812b68353e5Sstefano_zampini   }
1813b68353e5Sstefano_zampini 
1814b68353e5Sstefano_zampini   /* new row pointer */
1815580bdb30SBarry Smith   ierr = PetscArrayzero(ii,nr+1);CHKERRQ(ierr);
1816b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1817b68353e5Sstefano_zampini     PetscInt       ncr,rst;
1818b68353e5Sstefano_zampini 
1819b68353e5Sstefano_zampini     ierr = ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL);CHKERRQ(ierr);
1820b68353e5Sstefano_zampini     ierr = ISGetLocalSize(nest->isglobal.row[i],&ncr);CHKERRQ(ierr);
1821b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1822b68353e5Sstefano_zampini       if (aii[i*nest->nc+j]) {
1823b68353e5Sstefano_zampini         PetscInt    *nii = aii[i*nest->nc+j];
1824b68353e5Sstefano_zampini         PetscInt    ir;
1825b68353e5Sstefano_zampini 
1826b68353e5Sstefano_zampini         for (ir=rst; ir<ncr+rst; ++ir) {
1827b68353e5Sstefano_zampini           ii[ir+1] += nii[1]-nii[0];
1828b68353e5Sstefano_zampini           nii++;
1829b68353e5Sstefano_zampini         }
1830b68353e5Sstefano_zampini       }
1831b68353e5Sstefano_zampini     }
1832b68353e5Sstefano_zampini   }
1833b68353e5Sstefano_zampini   for (i=0; i<nr; i++) ii[i+1] += ii[i];
1834b68353e5Sstefano_zampini 
1835b68353e5Sstefano_zampini   /* construct CSR for the new matrix */
1836b68353e5Sstefano_zampini   ierr = PetscCalloc1(nr,&ci);CHKERRQ(ierr);
1837b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1838b68353e5Sstefano_zampini     PetscInt       ncr,rst;
1839b68353e5Sstefano_zampini 
1840b68353e5Sstefano_zampini     ierr = ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL);CHKERRQ(ierr);
1841b68353e5Sstefano_zampini     ierr = ISGetLocalSize(nest->isglobal.row[i],&ncr);CHKERRQ(ierr);
1842b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1843b68353e5Sstefano_zampini       if (aii[i*nest->nc+j]) {
1844b68353e5Sstefano_zampini         PetscScalar *nvv = avv[i*nest->nc+j];
1845b68353e5Sstefano_zampini         PetscInt    *nii = aii[i*nest->nc+j];
1846b68353e5Sstefano_zampini         PetscInt    *njj = ajj[i*nest->nc+j];
1847b68353e5Sstefano_zampini         PetscInt    ir,cst;
1848b68353e5Sstefano_zampini 
1849b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.col[j],&cst,NULL);CHKERRQ(ierr);
1850b68353e5Sstefano_zampini         for (ir=rst; ir<ncr+rst; ++ir) {
1851b68353e5Sstefano_zampini           PetscInt ij,rsize = nii[1]-nii[0],ist = ii[ir]+ci[ir];
1852b68353e5Sstefano_zampini 
1853b68353e5Sstefano_zampini           for (ij=0;ij<rsize;ij++) {
1854b68353e5Sstefano_zampini             jj[ist+ij] = *njj+cst;
1855b68353e5Sstefano_zampini             vv[ist+ij] = *nvv;
1856b68353e5Sstefano_zampini             njj++;
1857b68353e5Sstefano_zampini             nvv++;
1858b68353e5Sstefano_zampini           }
1859b68353e5Sstefano_zampini           ci[ir] += rsize;
1860b68353e5Sstefano_zampini           nii++;
1861b68353e5Sstefano_zampini         }
1862b68353e5Sstefano_zampini       }
1863b68353e5Sstefano_zampini     }
1864b68353e5Sstefano_zampini   }
1865b68353e5Sstefano_zampini   ierr = PetscFree(ci);CHKERRQ(ierr);
1866b68353e5Sstefano_zampini 
1867b68353e5Sstefano_zampini   /* restore info */
1868b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1869b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1870b68353e5Sstefano_zampini       Mat B = nest->m[i][j];
1871b68353e5Sstefano_zampini       if (B) {
1872b68353e5Sstefano_zampini         PetscInt nnr = 0, k = i*nest->nc+j;
187323875855Sstefano_zampini 
187423875855Sstefano_zampini         B    = (trans[k] ? trans[k] : B);
1875b68353e5Sstefano_zampini         ierr = MatRestoreRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&aii[k],(const PetscInt**)&ajj[k],&done);CHKERRQ(ierr);
1876b68353e5Sstefano_zampini         if (!done) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatRestoreRowIJ");
1877b68353e5Sstefano_zampini         ierr = MatSeqAIJRestoreArray(B,&avv[k]);CHKERRQ(ierr);
187823875855Sstefano_zampini         ierr = MatDestroy(&trans[k]);CHKERRQ(ierr);
1879b68353e5Sstefano_zampini       }
1880b68353e5Sstefano_zampini     }
1881b68353e5Sstefano_zampini   }
188223875855Sstefano_zampini   ierr = PetscFree4(aii,ajj,avv,trans);CHKERRQ(ierr);
1883b68353e5Sstefano_zampini 
1884b68353e5Sstefano_zampini   /* finalize newmat */
1885b68353e5Sstefano_zampini   if (reuse == MAT_INITIAL_MATRIX) {
1886b68353e5Sstefano_zampini     ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,newmat);CHKERRQ(ierr);
1887b68353e5Sstefano_zampini   } else if (reuse == MAT_INPLACE_MATRIX) {
1888b68353e5Sstefano_zampini     Mat B;
1889b68353e5Sstefano_zampini 
1890b68353e5Sstefano_zampini     ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,&B);CHKERRQ(ierr);
1891b68353e5Sstefano_zampini     ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr);
1892b68353e5Sstefano_zampini   }
1893b68353e5Sstefano_zampini   ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1894b68353e5Sstefano_zampini   ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1895b68353e5Sstefano_zampini   {
1896b68353e5Sstefano_zampini     Mat_SeqAIJ *a = (Mat_SeqAIJ*)((*newmat)->data);
1897b68353e5Sstefano_zampini     a->free_a     = PETSC_TRUE;
1898b68353e5Sstefano_zampini     a->free_ij    = PETSC_TRUE;
1899b68353e5Sstefano_zampini   }
1900b68353e5Sstefano_zampini   PetscFunctionReturn(0);
1901b68353e5Sstefano_zampini }
1902b68353e5Sstefano_zampini 
1903cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_Nest_AIJ(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
1904629c3df2SDmitry Karpeev {
1905629c3df2SDmitry Karpeev   PetscErrorCode ierr;
1906629c3df2SDmitry Karpeev   Mat_Nest       *nest = (Mat_Nest*)A->data;
190783b1a929SMark Adams   PetscInt       m,n,M,N,i,j,k,*dnnz,*onnz,rstart;
1908649b366bSFande Kong   PetscInt       cstart,cend;
1909b68353e5Sstefano_zampini   PetscMPIInt    size;
1910629c3df2SDmitry Karpeev   Mat            C;
1911629c3df2SDmitry Karpeev 
1912629c3df2SDmitry Karpeev   PetscFunctionBegin;
1913ffc4695bSBarry Smith   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&size);CHKERRMPI(ierr);
1914b68353e5Sstefano_zampini   if (size == 1) { /* look for a special case with SeqAIJ matrices and strided-1, contiguous, blocks */
1915b68353e5Sstefano_zampini     PetscInt  nf;
1916b68353e5Sstefano_zampini     PetscBool fast;
1917b68353e5Sstefano_zampini 
1918b68353e5Sstefano_zampini     ierr = PetscStrcmp(newtype,MATAIJ,&fast);CHKERRQ(ierr);
1919b68353e5Sstefano_zampini     if (!fast) {
1920b68353e5Sstefano_zampini       ierr = PetscStrcmp(newtype,MATSEQAIJ,&fast);CHKERRQ(ierr);
1921b68353e5Sstefano_zampini     }
1922b68353e5Sstefano_zampini     for (i=0; i<nest->nr && fast; ++i) {
1923b68353e5Sstefano_zampini       for (j=0; j<nest->nc && fast; ++j) {
1924b68353e5Sstefano_zampini         Mat B = nest->m[i][j];
1925b68353e5Sstefano_zampini         if (B) {
1926b68353e5Sstefano_zampini           ierr = PetscObjectTypeCompare((PetscObject)B,MATSEQAIJ,&fast);CHKERRQ(ierr);
192723875855Sstefano_zampini           if (!fast) {
192823875855Sstefano_zampini             PetscBool istrans;
192923875855Sstefano_zampini 
193023875855Sstefano_zampini             ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans);CHKERRQ(ierr);
193123875855Sstefano_zampini             if (istrans) {
193223875855Sstefano_zampini               Mat Bt;
193323875855Sstefano_zampini 
193423875855Sstefano_zampini               ierr = MatTransposeGetMat(B,&Bt);CHKERRQ(ierr);
193523875855Sstefano_zampini               ierr = PetscObjectTypeCompare((PetscObject)Bt,MATSEQAIJ,&fast);CHKERRQ(ierr);
193623875855Sstefano_zampini             }
1937b68353e5Sstefano_zampini           }
1938b68353e5Sstefano_zampini         }
1939b68353e5Sstefano_zampini       }
1940b68353e5Sstefano_zampini     }
1941b68353e5Sstefano_zampini     for (i=0, nf=0; i<nest->nr && fast; ++i) {
1942b68353e5Sstefano_zampini       ierr = PetscObjectTypeCompare((PetscObject)nest->isglobal.row[i],ISSTRIDE,&fast);CHKERRQ(ierr);
1943b68353e5Sstefano_zampini       if (fast) {
1944b68353e5Sstefano_zampini         PetscInt f,s;
1945b68353e5Sstefano_zampini 
1946b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.row[i],&f,&s);CHKERRQ(ierr);
1947b68353e5Sstefano_zampini         if (f != nf || s != 1) { fast = PETSC_FALSE; }
1948b68353e5Sstefano_zampini         else {
1949b68353e5Sstefano_zampini           ierr = ISGetSize(nest->isglobal.row[i],&f);CHKERRQ(ierr);
1950b68353e5Sstefano_zampini           nf  += f;
1951b68353e5Sstefano_zampini         }
1952b68353e5Sstefano_zampini       }
1953b68353e5Sstefano_zampini     }
1954b68353e5Sstefano_zampini     for (i=0, nf=0; i<nest->nc && fast; ++i) {
1955b68353e5Sstefano_zampini       ierr = PetscObjectTypeCompare((PetscObject)nest->isglobal.col[i],ISSTRIDE,&fast);CHKERRQ(ierr);
1956b68353e5Sstefano_zampini       if (fast) {
1957b68353e5Sstefano_zampini         PetscInt f,s;
1958b68353e5Sstefano_zampini 
1959b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.col[i],&f,&s);CHKERRQ(ierr);
1960b68353e5Sstefano_zampini         if (f != nf || s != 1) { fast = PETSC_FALSE; }
1961b68353e5Sstefano_zampini         else {
1962b68353e5Sstefano_zampini           ierr = ISGetSize(nest->isglobal.col[i],&f);CHKERRQ(ierr);
1963b68353e5Sstefano_zampini           nf  += f;
1964b68353e5Sstefano_zampini         }
1965b68353e5Sstefano_zampini       }
1966b68353e5Sstefano_zampini     }
1967b68353e5Sstefano_zampini     if (fast) {
1968b68353e5Sstefano_zampini       ierr = MatConvert_Nest_SeqAIJ_fast(A,newtype,reuse,newmat);CHKERRQ(ierr);
1969b68353e5Sstefano_zampini       PetscFunctionReturn(0);
1970b68353e5Sstefano_zampini     }
1971b68353e5Sstefano_zampini   }
1972629c3df2SDmitry Karpeev   ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr);
1973629c3df2SDmitry Karpeev   ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr);
1974649b366bSFande Kong   ierr = MatGetOwnershipRangeColumn(A,&cstart,&cend);CHKERRQ(ierr);
1975629c3df2SDmitry Karpeev   switch (reuse) {
1976629c3df2SDmitry Karpeev   case MAT_INITIAL_MATRIX:
1977ce94432eSBarry Smith     ierr    = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr);
1978629c3df2SDmitry Karpeev     ierr    = MatSetType(C,newtype);CHKERRQ(ierr);
1979629c3df2SDmitry Karpeev     ierr    = MatSetSizes(C,m,n,M,N);CHKERRQ(ierr);
1980629c3df2SDmitry Karpeev     *newmat = C;
1981629c3df2SDmitry Karpeev     break;
1982629c3df2SDmitry Karpeev   case MAT_REUSE_MATRIX:
1983629c3df2SDmitry Karpeev     C = *newmat;
1984629c3df2SDmitry Karpeev     break;
1985ce94432eSBarry Smith   default: SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MatReuse");
1986629c3df2SDmitry Karpeev   }
1987785e854fSJed Brown   ierr = PetscMalloc1(2*m,&dnnz);CHKERRQ(ierr);
1988629c3df2SDmitry Karpeev   onnz = dnnz + m;
1989629c3df2SDmitry Karpeev   for (k=0; k<m; k++) {
1990629c3df2SDmitry Karpeev     dnnz[k] = 0;
1991629c3df2SDmitry Karpeev     onnz[k] = 0;
1992629c3df2SDmitry Karpeev   }
1993629c3df2SDmitry Karpeev   for (j=0; j<nest->nc; ++j) {
1994629c3df2SDmitry Karpeev     IS             bNis;
1995629c3df2SDmitry Karpeev     PetscInt       bN;
1996629c3df2SDmitry Karpeev     const PetscInt *bNindices;
1997629c3df2SDmitry Karpeev     /* Using global column indices and ISAllGather() is not scalable. */
1998629c3df2SDmitry Karpeev     ierr = ISAllGather(nest->isglobal.col[j], &bNis);CHKERRQ(ierr);
1999629c3df2SDmitry Karpeev     ierr = ISGetSize(bNis, &bN);CHKERRQ(ierr);
2000629c3df2SDmitry Karpeev     ierr = ISGetIndices(bNis,&bNindices);CHKERRQ(ierr);
2001629c3df2SDmitry Karpeev     for (i=0; i<nest->nr; ++i) {
2002629c3df2SDmitry Karpeev       PetscSF        bmsf;
2003649b366bSFande Kong       PetscSFNode    *iremote;
2004629c3df2SDmitry Karpeev       Mat            B;
2005649b366bSFande Kong       PetscInt       bm, *sub_dnnz,*sub_onnz, br;
2006629c3df2SDmitry Karpeev       const PetscInt *bmindices;
2007629c3df2SDmitry Karpeev       B = nest->m[i][j];
2008629c3df2SDmitry Karpeev       if (!B) continue;
2009629c3df2SDmitry Karpeev       ierr = ISGetLocalSize(nest->isglobal.row[i],&bm);CHKERRQ(ierr);
2010629c3df2SDmitry Karpeev       ierr = ISGetIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2011ce94432eSBarry Smith       ierr = PetscSFCreate(PetscObjectComm((PetscObject)A), &bmsf);CHKERRQ(ierr);
2012649b366bSFande Kong       ierr = PetscMalloc1(bm,&iremote);CHKERRQ(ierr);
2013649b366bSFande Kong       ierr = PetscMalloc1(bm,&sub_dnnz);CHKERRQ(ierr);
2014649b366bSFande Kong       ierr = PetscMalloc1(bm,&sub_onnz);CHKERRQ(ierr);
2015649b366bSFande Kong       for (k = 0; k < bm; ++k){
2016649b366bSFande Kong         sub_dnnz[k] = 0;
2017649b366bSFande Kong         sub_onnz[k] = 0;
2018649b366bSFande Kong       }
2019629c3df2SDmitry Karpeev       /*
2020629c3df2SDmitry Karpeev        Locate the owners for all of the locally-owned global row indices for this row block.
2021629c3df2SDmitry Karpeev        These determine the roots of PetscSF used to communicate preallocation data to row owners.
2022629c3df2SDmitry Karpeev        The roots correspond to the dnnz and onnz entries; thus, there are two roots per row.
2023629c3df2SDmitry Karpeev        */
202483b1a929SMark Adams       ierr = MatGetOwnershipRange(B,&rstart,NULL);CHKERRQ(ierr);
2025629c3df2SDmitry Karpeev       for (br = 0; br < bm; ++br) {
2026131c27b5Sprj-         PetscInt       row = bmindices[br], brncols, col;
2027629c3df2SDmitry Karpeev         const PetscInt *brcols;
2028a4b3d3acSMatthew G Knepley         PetscInt       rowrel = 0; /* row's relative index on its owner rank */
2029131c27b5Sprj-         PetscMPIInt    rowowner = 0;
2030629c3df2SDmitry Karpeev         ierr      = PetscLayoutFindOwnerIndex(A->rmap,row,&rowowner,&rowrel);CHKERRQ(ierr);
2031649b366bSFande Kong         /* how many roots  */
2032649b366bSFande Kong         iremote[br].rank = rowowner; iremote[br].index = rowrel;           /* edge from bmdnnz to dnnz */
2033649b366bSFande Kong         /* get nonzero pattern */
203483b1a929SMark Adams         ierr = MatGetRow(B,br+rstart,&brncols,&brcols,NULL);CHKERRQ(ierr);
2035629c3df2SDmitry Karpeev         for (k=0; k<brncols; k++) {
2036629c3df2SDmitry Karpeev           col  = bNindices[brcols[k]];
2037649b366bSFande Kong           if (col>=A->cmap->range[rowowner] && col<A->cmap->range[rowowner+1]) {
2038649b366bSFande Kong             sub_dnnz[br]++;
2039649b366bSFande Kong           } else {
2040649b366bSFande Kong             sub_onnz[br]++;
2041649b366bSFande Kong           }
2042629c3df2SDmitry Karpeev         }
204383b1a929SMark Adams         ierr = MatRestoreRow(B,br+rstart,&brncols,&brcols,NULL);CHKERRQ(ierr);
2044629c3df2SDmitry Karpeev       }
2045629c3df2SDmitry Karpeev       ierr = ISRestoreIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2046629c3df2SDmitry Karpeev       /* bsf will have to take care of disposing of bedges. */
2047649b366bSFande Kong       ierr = PetscSFSetGraph(bmsf,m,bm,NULL,PETSC_OWN_POINTER,iremote,PETSC_OWN_POINTER);CHKERRQ(ierr);
2048649b366bSFande Kong       ierr = PetscSFReduceBegin(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM);CHKERRQ(ierr);
2049649b366bSFande Kong       ierr = PetscSFReduceEnd(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM);CHKERRQ(ierr);
2050649b366bSFande Kong       ierr = PetscSFReduceBegin(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM);CHKERRQ(ierr);
2051649b366bSFande Kong       ierr = PetscSFReduceEnd(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM);CHKERRQ(ierr);
2052649b366bSFande Kong       ierr = PetscFree(sub_dnnz);CHKERRQ(ierr);
2053649b366bSFande Kong       ierr = PetscFree(sub_onnz);CHKERRQ(ierr);
2054629c3df2SDmitry Karpeev       ierr = PetscSFDestroy(&bmsf);CHKERRQ(ierr);
2055629c3df2SDmitry Karpeev     }
205622d28d08SBarry Smith     ierr = ISRestoreIndices(bNis,&bNindices);CHKERRQ(ierr);
2057629c3df2SDmitry Karpeev     ierr = ISDestroy(&bNis);CHKERRQ(ierr);
205865a4a0a3Sstefano_zampini   }
205965a4a0a3Sstefano_zampini   /* Resize preallocation if overestimated */
206065a4a0a3Sstefano_zampini   for (i=0;i<m;i++) {
206165a4a0a3Sstefano_zampini     dnnz[i] = PetscMin(dnnz[i],A->cmap->n);
206265a4a0a3Sstefano_zampini     onnz[i] = PetscMin(onnz[i],A->cmap->N - A->cmap->n);
2063629c3df2SDmitry Karpeev   }
2064629c3df2SDmitry Karpeev   ierr = MatSeqAIJSetPreallocation(C,0,dnnz);CHKERRQ(ierr);
2065629c3df2SDmitry Karpeev   ierr = MatMPIAIJSetPreallocation(C,0,dnnz,0,onnz);CHKERRQ(ierr);
2066629c3df2SDmitry Karpeev   ierr = PetscFree(dnnz);CHKERRQ(ierr);
2067629c3df2SDmitry Karpeev 
2068629c3df2SDmitry Karpeev   /* Fill by row */
2069629c3df2SDmitry Karpeev   for (j=0; j<nest->nc; ++j) {
2070629c3df2SDmitry Karpeev     /* Using global column indices and ISAllGather() is not scalable. */
2071629c3df2SDmitry Karpeev     IS             bNis;
2072629c3df2SDmitry Karpeev     PetscInt       bN;
2073629c3df2SDmitry Karpeev     const PetscInt *bNindices;
2074629c3df2SDmitry Karpeev     ierr = ISAllGather(nest->isglobal.col[j], &bNis);CHKERRQ(ierr);
2075629c3df2SDmitry Karpeev     ierr = ISGetSize(bNis,&bN);CHKERRQ(ierr);
2076629c3df2SDmitry Karpeev     ierr = ISGetIndices(bNis,&bNindices);CHKERRQ(ierr);
2077629c3df2SDmitry Karpeev     for (i=0; i<nest->nr; ++i) {
2078629c3df2SDmitry Karpeev       Mat            B;
2079629c3df2SDmitry Karpeev       PetscInt       bm, br;
2080629c3df2SDmitry Karpeev       const PetscInt *bmindices;
2081629c3df2SDmitry Karpeev       B = nest->m[i][j];
2082629c3df2SDmitry Karpeev       if (!B) continue;
2083629c3df2SDmitry Karpeev       ierr = ISGetLocalSize(nest->isglobal.row[i],&bm);CHKERRQ(ierr);
2084629c3df2SDmitry Karpeev       ierr = ISGetIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
208583b1a929SMark Adams       ierr = MatGetOwnershipRange(B,&rstart,NULL);CHKERRQ(ierr);
2086629c3df2SDmitry Karpeev       for (br = 0; br < bm; ++br) {
2087629c3df2SDmitry Karpeev         PetscInt          row = bmindices[br], brncols,  *cols;
2088629c3df2SDmitry Karpeev         const PetscInt    *brcols;
2089629c3df2SDmitry Karpeev         const PetscScalar *brcoldata;
209083b1a929SMark Adams         ierr = MatGetRow(B,br+rstart,&brncols,&brcols,&brcoldata);CHKERRQ(ierr);
2091785e854fSJed Brown         ierr = PetscMalloc1(brncols,&cols);CHKERRQ(ierr);
209226fbe8dcSKarl Rupp         for (k=0; k<brncols; k++) cols[k] = bNindices[brcols[k]];
2093629c3df2SDmitry Karpeev         /*
2094629c3df2SDmitry Karpeev           Nest blocks are required to be nonoverlapping -- otherwise nest and monolithic index layouts wouldn't match.
2095629c3df2SDmitry Karpeev           Thus, we could use INSERT_VALUES, but I prefer ADD_VALUES.
2096629c3df2SDmitry Karpeev          */
2097a2ea699eSBarry Smith         ierr = MatSetValues(C,1,&row,brncols,cols,brcoldata,ADD_VALUES);CHKERRQ(ierr);
209883b1a929SMark Adams         ierr = MatRestoreRow(B,br+rstart,&brncols,&brcols,&brcoldata);CHKERRQ(ierr);
2099629c3df2SDmitry Karpeev         ierr = PetscFree(cols);CHKERRQ(ierr);
2100629c3df2SDmitry Karpeev       }
2101629c3df2SDmitry Karpeev       ierr = ISRestoreIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2102629c3df2SDmitry Karpeev     }
2103a2ea699eSBarry Smith     ierr = ISRestoreIndices(bNis,&bNindices);CHKERRQ(ierr);
2104629c3df2SDmitry Karpeev     ierr = ISDestroy(&bNis);CHKERRQ(ierr);
2105629c3df2SDmitry Karpeev   }
2106629c3df2SDmitry Karpeev   ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2107629c3df2SDmitry Karpeev   ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2108629c3df2SDmitry Karpeev   PetscFunctionReturn(0);
2109629c3df2SDmitry Karpeev }
2110629c3df2SDmitry Karpeev 
21118b7d3b4bSBarry Smith PetscErrorCode MatHasOperation_Nest(Mat mat,MatOperation op,PetscBool *has)
21128b7d3b4bSBarry Smith {
21138b7d3b4bSBarry Smith   Mat_Nest       *bA = (Mat_Nest*)mat->data;
21143c6db4c4SPierre Jolivet   MatOperation   opAdd;
21158b7d3b4bSBarry Smith   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
21168b7d3b4bSBarry Smith   PetscBool      flg;
211752c5f739Sprj-   PetscErrorCode ierr;
211852c5f739Sprj-   PetscFunctionBegin;
21198b7d3b4bSBarry Smith 
212052c5f739Sprj-   *has = PETSC_FALSE;
21213c6db4c4SPierre Jolivet   if (op == MATOP_MULT || op == MATOP_MULT_ADD || op == MATOP_MULT_TRANSPOSE || op == MATOP_MULT_TRANSPOSE_ADD) {
21223c6db4c4SPierre Jolivet     opAdd = (op == MATOP_MULT || op == MATOP_MULT_ADD ? MATOP_MULT_ADD : MATOP_MULT_TRANSPOSE_ADD);
21238b7d3b4bSBarry Smith     for (j=0; j<nc; j++) {
21248b7d3b4bSBarry Smith       for (i=0; i<nr; i++) {
21258b7d3b4bSBarry Smith         if (!bA->m[i][j]) continue;
21263c6db4c4SPierre Jolivet         ierr = MatHasOperation(bA->m[i][j],opAdd,&flg);CHKERRQ(ierr);
21278b7d3b4bSBarry Smith         if (!flg) PetscFunctionReturn(0);
21288b7d3b4bSBarry Smith       }
21298b7d3b4bSBarry Smith     }
21308b7d3b4bSBarry Smith   }
21313c6db4c4SPierre Jolivet   if (((void**)mat->ops)[op]) *has = PETSC_TRUE;
21328b7d3b4bSBarry Smith   PetscFunctionReturn(0);
21338b7d3b4bSBarry Smith }
21348b7d3b4bSBarry Smith 
2135659c6bb0SJed Brown /*MC
2136659c6bb0SJed Brown   MATNEST - MATNEST = "nest" - Matrix type consisting of nested submatrices, each stored separately.
2137659c6bb0SJed Brown 
2138659c6bb0SJed Brown   Level: intermediate
2139659c6bb0SJed Brown 
2140659c6bb0SJed Brown   Notes:
2141659c6bb0SJed Brown   This matrix type permits scalable use of PCFieldSplit and avoids the large memory costs of extracting submatrices.
2142659c6bb0SJed Brown   It allows the use of symmetric and block formats for parts of multi-physics simulations.
  It is usually used with DMComposite and DMCreateMatrix().
2144659c6bb0SJed Brown 
  Each of the submatrices lives on the same MPI communicator as the original nest matrix (though they can have zero
  rows/columns on some processes). Thus this is not meant for cases where the submatrices live on far fewer processes
  than the nest matrix.
21488b7d3b4bSBarry Smith 
214979798668SBarry Smith .seealso: MatCreate(), MatType, MatCreateNest(), MatNestSetSubMat(), MatNestGetSubMat(),
215079798668SBarry Smith           VecCreateNest(), DMCreateMatrix(), DMCOMPOSITE, MatNestSetVecType(), MatNestGetLocalISs(),
215179798668SBarry Smith           MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats()
2152659c6bb0SJed Brown M*/
21538cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_Nest(Mat A)
2154c8883902SJed Brown {
2155c8883902SJed Brown   Mat_Nest       *s;
2156c8883902SJed Brown   PetscErrorCode ierr;
2157c8883902SJed Brown 
2158c8883902SJed Brown   PetscFunctionBegin;
2159b00a9115SJed Brown   ierr    = PetscNewLog(A,&s);CHKERRQ(ierr);
2160c8883902SJed Brown   A->data = (void*)s;
2161e7c19651SJed Brown 
2162e7c19651SJed Brown   s->nr            = -1;
2163e7c19651SJed Brown   s->nc            = -1;
21640298fd71SBarry Smith   s->m             = NULL;
2165e7c19651SJed Brown   s->splitassembly = PETSC_FALSE;
2166c8883902SJed Brown 
2167c8883902SJed Brown   ierr = PetscMemzero(A->ops,sizeof(*A->ops));CHKERRQ(ierr);
216826fbe8dcSKarl Rupp 
2169c8883902SJed Brown   A->ops->mult                  = MatMult_Nest;
21709194d70fSJed Brown   A->ops->multadd               = MatMultAdd_Nest;
2171c8883902SJed Brown   A->ops->multtranspose         = MatMultTranspose_Nest;
21729194d70fSJed Brown   A->ops->multtransposeadd      = MatMultTransposeAdd_Nest;
2173f8170845SAlex Fikl   A->ops->transpose             = MatTranspose_Nest;
2174c8883902SJed Brown   A->ops->assemblybegin         = MatAssemblyBegin_Nest;
2175c8883902SJed Brown   A->ops->assemblyend           = MatAssemblyEnd_Nest;
2176c8883902SJed Brown   A->ops->zeroentries           = MatZeroEntries_Nest;
2177c222c20dSDavid Ham   A->ops->copy                  = MatCopy_Nest;
21786e76ffeaSPierre Jolivet   A->ops->axpy                  = MatAXPY_Nest;
2179c8883902SJed Brown   A->ops->duplicate             = MatDuplicate_Nest;
21807dae84e0SHong Zhang   A->ops->createsubmatrix       = MatCreateSubMatrix_Nest;
2181c8883902SJed Brown   A->ops->destroy               = MatDestroy_Nest;
2182c8883902SJed Brown   A->ops->view                  = MatView_Nest;
2183f4259b30SLisandro Dalcin   A->ops->getvecs               = NULL; /* Use VECNEST by calling MatNestSetVecType(A,VECNEST) */
2184c8883902SJed Brown   A->ops->getlocalsubmatrix     = MatGetLocalSubMatrix_Nest;
2185c8883902SJed Brown   A->ops->restorelocalsubmatrix = MatRestoreLocalSubMatrix_Nest;
2186429bac76SJed Brown   A->ops->getdiagonal           = MatGetDiagonal_Nest;
2187429bac76SJed Brown   A->ops->diagonalscale         = MatDiagonalScale_Nest;
2188a061e289SJed Brown   A->ops->scale                 = MatScale_Nest;
2189a061e289SJed Brown   A->ops->shift                 = MatShift_Nest;
219013135bc6SAlex Fikl   A->ops->diagonalset           = MatDiagonalSet_Nest;
2191f8170845SAlex Fikl   A->ops->setrandom             = MatSetRandom_Nest;
21928b7d3b4bSBarry Smith   A->ops->hasoperation          = MatHasOperation_Nest;
2193381b8e50SStefano Zampini   A->ops->missingdiagonal       = MatMissingDiagonal_Nest;
2194c8883902SJed Brown 
2195f4259b30SLisandro Dalcin   A->spptr        = NULL;
2196c8883902SJed Brown   A->assembled    = PETSC_FALSE;
2197c8883902SJed Brown 
2198c8883902SJed Brown   /* expose Nest api's */
2199bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",        MatNestGetSubMat_Nest);CHKERRQ(ierr);
2200bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",        MatNestSetSubMat_Nest);CHKERRQ(ierr);
2201bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",       MatNestGetSubMats_Nest);CHKERRQ(ierr);
2202bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",          MatNestGetSize_Nest);CHKERRQ(ierr);
2203bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",           MatNestGetISs_Nest);CHKERRQ(ierr);
2204bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",      MatNestGetLocalISs_Nest);CHKERRQ(ierr);
2205bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",       MatNestSetVecType_Nest);CHKERRQ(ierr);
2206bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",       MatNestSetSubMats_Nest);CHKERRQ(ierr);
22070899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",  MatConvert_Nest_AIJ);CHKERRQ(ierr);
22080899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",  MatConvert_Nest_AIJ);CHKERRQ(ierr);
220983b1a929SMark Adams   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",     MatConvert_Nest_AIJ);CHKERRQ(ierr);
22105e3038f0Sstefano_zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",      MatConvert_Nest_IS);CHKERRQ(ierr);
22114222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_seqdense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr);
22124222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_mpidense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr);
22134222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_dense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr);
2214c8883902SJed Brown 
2215c8883902SJed Brown   ierr = PetscObjectChangeTypeName((PetscObject)A,MATNEST);CHKERRQ(ierr);
2216c8883902SJed Brown   PetscFunctionReturn(0);
2217c8883902SJed Brown }
2218