xref: /petsc/src/mat/impls/nest/matnest.c (revision be705e3a7cf841efc25acbae09e8f0554ea4f143)
1aaa7dc30SBarry Smith #include <../src/mat/impls/nest/matnestimpl.h> /*I   "petscmat.h"   I*/
2b68353e5Sstefano_zampini #include <../src/mat/impls/aij/seq/aij.h>
30c312b8eSJed Brown #include <petscsf.h>
4d8588912SDave May 
5c8883902SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat,PetscInt,const IS[],PetscInt,const IS[]);
606a1af2fSStefano Zampini static PetscErrorCode MatCreateVecs_Nest(Mat,Vec*,Vec*);
706a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat);
806a1af2fSStefano Zampini 
95e3038f0Sstefano_zampini PETSC_INTERN PetscErrorCode MatConvert_Nest_IS(Mat,MatType,MatReuse,Mat*);
10c8883902SJed Brown 
11d8588912SDave May /* private functions */
128188e55aSJed Brown static PetscErrorCode MatNestGetSizes_Private(Mat A,PetscInt *m,PetscInt *n,PetscInt *M,PetscInt *N)
13d8588912SDave May {
14d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
158188e55aSJed Brown   PetscInt       i,j;
16d8588912SDave May   PetscErrorCode ierr;
17d8588912SDave May 
18d8588912SDave May   PetscFunctionBegin;
198188e55aSJed Brown   *m = *n = *M = *N = 0;
208188e55aSJed Brown   for (i=0; i<bA->nr; i++) {  /* rows */
218188e55aSJed Brown     PetscInt sm,sM;
228188e55aSJed Brown     ierr = ISGetLocalSize(bA->isglobal.row[i],&sm);CHKERRQ(ierr);
238188e55aSJed Brown     ierr = ISGetSize(bA->isglobal.row[i],&sM);CHKERRQ(ierr);
248188e55aSJed Brown     *m  += sm;
258188e55aSJed Brown     *M  += sM;
26d8588912SDave May   }
278188e55aSJed Brown   for (j=0; j<bA->nc; j++) {  /* cols */
288188e55aSJed Brown     PetscInt sn,sN;
298188e55aSJed Brown     ierr = ISGetLocalSize(bA->isglobal.col[j],&sn);CHKERRQ(ierr);
308188e55aSJed Brown     ierr = ISGetSize(bA->isglobal.col[j],&sN);CHKERRQ(ierr);
318188e55aSJed Brown     *n  += sn;
328188e55aSJed Brown     *N  += sN;
33d8588912SDave May   }
34d8588912SDave May   PetscFunctionReturn(0);
35d8588912SDave May }
36d8588912SDave May 
37d8588912SDave May /* operations */
38207556f9SJed Brown static PetscErrorCode MatMult_Nest(Mat A,Vec x,Vec y)
39d8588912SDave May {
40d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
41207556f9SJed Brown   Vec            *bx = bA->right,*by = bA->left;
42207556f9SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
43d8588912SDave May   PetscErrorCode ierr;
44d8588912SDave May 
45d8588912SDave May   PetscFunctionBegin;
46207556f9SJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(y,bA->isglobal.row[i],&by[i]);CHKERRQ(ierr);}
47207556f9SJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
48207556f9SJed Brown   for (i=0; i<nr; i++) {
49d8588912SDave May     ierr = VecZeroEntries(by[i]);CHKERRQ(ierr);
50207556f9SJed Brown     for (j=0; j<nc; j++) {
51207556f9SJed Brown       if (!bA->m[i][j]) continue;
52d8588912SDave May       /* y[i] <- y[i] + A[i][j] * x[j] */
53d8588912SDave May       ierr = MatMultAdd(bA->m[i][j],bx[j],by[i],by[i]);CHKERRQ(ierr);
54d8588912SDave May     }
55d8588912SDave May   }
56207556f9SJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(y,bA->isglobal.row[i],&by[i]);CHKERRQ(ierr);}
57207556f9SJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
58d8588912SDave May   PetscFunctionReturn(0);
59d8588912SDave May }
60d8588912SDave May 
619194d70fSJed Brown static PetscErrorCode MatMultAdd_Nest(Mat A,Vec x,Vec y,Vec z)
629194d70fSJed Brown {
639194d70fSJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
649194d70fSJed Brown   Vec            *bx = bA->right,*bz = bA->left;
659194d70fSJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
669194d70fSJed Brown   PetscErrorCode ierr;
679194d70fSJed Brown 
689194d70fSJed Brown   PetscFunctionBegin;
699194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(z,bA->isglobal.row[i],&bz[i]);CHKERRQ(ierr);}
709194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
719194d70fSJed Brown   for (i=0; i<nr; i++) {
729194d70fSJed Brown     if (y != z) {
739194d70fSJed Brown       Vec by;
749194d70fSJed Brown       ierr = VecGetSubVector(y,bA->isglobal.row[i],&by);CHKERRQ(ierr);
759194d70fSJed Brown       ierr = VecCopy(by,bz[i]);CHKERRQ(ierr);
76336d21e7SJed Brown       ierr = VecRestoreSubVector(y,bA->isglobal.row[i],&by);CHKERRQ(ierr);
779194d70fSJed Brown     }
789194d70fSJed Brown     for (j=0; j<nc; j++) {
799194d70fSJed Brown       if (!bA->m[i][j]) continue;
809194d70fSJed Brown       /* y[i] <- y[i] + A[i][j] * x[j] */
819194d70fSJed Brown       ierr = MatMultAdd(bA->m[i][j],bx[j],bz[i],bz[i]);CHKERRQ(ierr);
829194d70fSJed Brown     }
839194d70fSJed Brown   }
849194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(z,bA->isglobal.row[i],&bz[i]);CHKERRQ(ierr);}
859194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
869194d70fSJed Brown   PetscFunctionReturn(0);
879194d70fSJed Brown }
889194d70fSJed Brown 
8952c5f739Sprj- typedef struct {
9052c5f739Sprj-   Mat          *workC;    /* array of Mat with specific containers depending on the underlying MatMatMult implementation */
9152c5f739Sprj-   PetscScalar  *tarray;   /* buffer for storing all temporary products A[i][j] B[j] */
9252c5f739Sprj-   PetscInt     *dm,*dn,k; /* displacements and number of submatrices */
9352c5f739Sprj- } Nest_Dense;
9452c5f739Sprj- 
956718818eSStefano Zampini PETSC_INTERN PetscErrorCode MatProductNumeric_Nest_Dense(Mat C)
9652c5f739Sprj- {
976718818eSStefano Zampini   Mat_Nest          *bA;
9852c5f739Sprj-   Nest_Dense        *contents;
996718818eSStefano Zampini   Mat               viewB,viewC,productB,workC;
10052c5f739Sprj-   const PetscScalar *barray;
10152c5f739Sprj-   PetscScalar       *carray;
1026718818eSStefano Zampini   PetscInt          i,j,M,N,nr,nc,ldb,ldc;
10352c5f739Sprj-   PetscErrorCode    ierr;
1046718818eSStefano Zampini   Mat               A,B;
10552c5f739Sprj- 
10652c5f739Sprj-   PetscFunctionBegin;
1076718818eSStefano Zampini   MatCheckProduct(C,3);
1086718818eSStefano Zampini   A    = C->product->A;
1096718818eSStefano Zampini   B    = C->product->B;
1106718818eSStefano Zampini   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
1116718818eSStefano Zampini   if (!N) {
1126718818eSStefano Zampini     ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1136718818eSStefano Zampini     ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1146718818eSStefano Zampini     PetscFunctionReturn(0);
1156718818eSStefano Zampini   }
1166718818eSStefano Zampini   contents = (Nest_Dense*)C->product->data;
1176718818eSStefano Zampini   if (!contents) SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Product data empty");
1186718818eSStefano Zampini   bA   = (Mat_Nest*)A->data;
1196718818eSStefano Zampini   nr   = bA->nr;
1206718818eSStefano Zampini   nc   = bA->nc;
12152c5f739Sprj-   ierr = MatDenseGetLDA(B,&ldb);CHKERRQ(ierr);
12252c5f739Sprj-   ierr = MatDenseGetLDA(C,&ldc);CHKERRQ(ierr);
12352c5f739Sprj-   ierr = MatZeroEntries(C);CHKERRQ(ierr);
12452c5f739Sprj-   ierr = MatDenseGetArrayRead(B,&barray);CHKERRQ(ierr);
1256718818eSStefano Zampini   ierr = MatDenseGetArrayWrite(C,&carray);CHKERRQ(ierr);
12652c5f739Sprj-   for (i=0; i<nr; i++) {
12752c5f739Sprj-     ierr = ISGetSize(bA->isglobal.row[i],&M);CHKERRQ(ierr);
12852c5f739Sprj-     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dm[i+1]-contents->dm[i],PETSC_DECIDE,M,N,carray+contents->dm[i],&viewC);CHKERRQ(ierr);
1296718818eSStefano Zampini     ierr = MatDenseSetLDA(viewC,ldc);CHKERRQ(ierr);
13052c5f739Sprj-     for (j=0; j<nc; j++) {
13152c5f739Sprj-       if (!bA->m[i][j]) continue;
13252c5f739Sprj-       ierr = ISGetSize(bA->isglobal.col[j],&M);CHKERRQ(ierr);
13352c5f739Sprj-       ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB);CHKERRQ(ierr);
1346718818eSStefano Zampini       ierr = MatDenseSetLDA(viewB,ldb);CHKERRQ(ierr);
1354222ddf1SHong Zhang 
1364222ddf1SHong Zhang       /* MatMatMultNumeric(bA->m[i][j],viewB,contents->workC[i*nc + j]); */
1374222ddf1SHong Zhang       workC             = contents->workC[i*nc + j];
1384222ddf1SHong Zhang       productB          = workC->product->B;
1394222ddf1SHong Zhang       workC->product->B = viewB; /* use newly created dense matrix viewB */
1406718818eSStefano Zampini       ierr = MatProductNumeric(workC);CHKERRQ(ierr);
14152c5f739Sprj-       ierr = MatDestroy(&viewB);CHKERRQ(ierr);
1424222ddf1SHong Zhang       workC->product->B = productB; /* resume original B */
1434222ddf1SHong Zhang 
14452c5f739Sprj-       /* C[i] <- workC + C[i] */
14552c5f739Sprj-       ierr = MatAXPY(viewC,1.0,contents->workC[i*nc + j],SAME_NONZERO_PATTERN);CHKERRQ(ierr);
14652c5f739Sprj-     }
14752c5f739Sprj-     ierr = MatDestroy(&viewC);CHKERRQ(ierr);
14852c5f739Sprj-   }
1496718818eSStefano Zampini   ierr = MatDenseRestoreArrayWrite(C,&carray);CHKERRQ(ierr);
15052c5f739Sprj-   ierr = MatDenseRestoreArrayRead(B,&barray);CHKERRQ(ierr);
1514222ddf1SHong Zhang 
1524222ddf1SHong Zhang   ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1534222ddf1SHong Zhang   ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15452c5f739Sprj-   PetscFunctionReturn(0);
15552c5f739Sprj- }
15652c5f739Sprj- 
15752c5f739Sprj- PetscErrorCode MatNest_DenseDestroy(void *ctx)
15852c5f739Sprj- {
15952c5f739Sprj-   Nest_Dense     *contents = (Nest_Dense*)ctx;
16052c5f739Sprj-   PetscInt       i;
16152c5f739Sprj-   PetscErrorCode ierr;
16252c5f739Sprj- 
16352c5f739Sprj-   PetscFunctionBegin;
16452c5f739Sprj-   ierr = PetscFree(contents->tarray);CHKERRQ(ierr);
16552c5f739Sprj-   for (i=0; i<contents->k; i++) {
16652c5f739Sprj-     ierr = MatDestroy(contents->workC + i);CHKERRQ(ierr);
16752c5f739Sprj-   }
16852c5f739Sprj-   ierr = PetscFree3(contents->dm,contents->dn,contents->workC);CHKERRQ(ierr);
16952c5f739Sprj-   ierr = PetscFree(contents);CHKERRQ(ierr);
17052c5f739Sprj-   PetscFunctionReturn(0);
17152c5f739Sprj- }
17252c5f739Sprj- 
1736718818eSStefano Zampini PETSC_INTERN PetscErrorCode MatProductSymbolic_Nest_Dense(Mat C)
17452c5f739Sprj- {
1756718818eSStefano Zampini   Mat_Nest          *bA;
1766718818eSStefano Zampini   Mat               viewB,workC;
17752c5f739Sprj-   const PetscScalar *barray;
1786718818eSStefano Zampini   PetscInt          i,j,M,N,m,n,nr,nc,maxm = 0,ldb;
1794222ddf1SHong Zhang   Nest_Dense        *contents=NULL;
1806718818eSStefano Zampini   PetscBool         cisdense;
18152c5f739Sprj-   PetscErrorCode    ierr;
1826718818eSStefano Zampini   Mat               A,B;
1836718818eSStefano Zampini   PetscReal         fill;
18452c5f739Sprj- 
18552c5f739Sprj-   PetscFunctionBegin;
1866718818eSStefano Zampini   MatCheckProduct(C,4);
1876718818eSStefano Zampini   if (C->product->data) SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Product data not empty");
1886718818eSStefano Zampini   A    = C->product->A;
1896718818eSStefano Zampini   B    = C->product->B;
1906718818eSStefano Zampini   fill = C->product->fill;
1916718818eSStefano Zampini   bA   = (Mat_Nest*)A->data;
1926718818eSStefano Zampini   nr   = bA->nr;
1936718818eSStefano Zampini   nc   = bA->nc;
1946718818eSStefano Zampini   ierr = MatGetLocalSize(B,NULL,&n);CHKERRQ(ierr);
19552c5f739Sprj-   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
19652c5f739Sprj-   ierr = MatGetLocalSize(A,&m,NULL);CHKERRQ(ierr);
19752c5f739Sprj-   ierr = MatGetSize(A,&M,NULL);CHKERRQ(ierr);
1986718818eSStefano Zampini   ierr = MatSetSizes(C,m,n,M,N);CHKERRQ(ierr);
1996718818eSStefano Zampini   ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATMPIDENSE,MATSEQDENSECUDA,MATMPIDENSECUDA,"");CHKERRQ(ierr);
2006718818eSStefano Zampini   if (!cisdense) {
2016718818eSStefano Zampini     ierr = MatSetType(C,((PetscObject)B)->type_name);CHKERRQ(ierr);
2026718818eSStefano Zampini   }
20318992e5dSStefano Zampini   ierr = MatSetUp(C);CHKERRQ(ierr);
2046718818eSStefano Zampini   if (!N) {
2056718818eSStefano Zampini     C->ops->productnumeric = MatProductNumeric_Nest_Dense;
2066718818eSStefano Zampini     PetscFunctionReturn(0);
20752c5f739Sprj-   }
20852c5f739Sprj- 
20952c5f739Sprj-   ierr = PetscNew(&contents);CHKERRQ(ierr);
2106718818eSStefano Zampini   C->product->data = contents;
2116718818eSStefano Zampini   C->product->destroy = MatNest_DenseDestroy;
21252c5f739Sprj-   ierr = PetscCalloc3(nr+1,&contents->dm,nc+1,&contents->dn,nr*nc,&contents->workC);CHKERRQ(ierr);
21352c5f739Sprj-   contents->k = nr*nc;
21452c5f739Sprj-   for (i=0; i<nr; i++) {
21552c5f739Sprj-     ierr = ISGetLocalSize(bA->isglobal.row[i],contents->dm + i+1);CHKERRQ(ierr);
21652c5f739Sprj-     maxm = PetscMax(maxm,contents->dm[i+1]);
21752c5f739Sprj-     contents->dm[i+1] += contents->dm[i];
21852c5f739Sprj-   }
21952c5f739Sprj-   for (i=0; i<nc; i++) {
22052c5f739Sprj-     ierr = ISGetLocalSize(bA->isglobal.col[i],contents->dn + i+1);CHKERRQ(ierr);
22152c5f739Sprj-     contents->dn[i+1] += contents->dn[i];
22252c5f739Sprj-   }
22352c5f739Sprj-   ierr = PetscMalloc1(maxm*N,&contents->tarray);CHKERRQ(ierr);
22452c5f739Sprj-   ierr = MatDenseGetLDA(B,&ldb);CHKERRQ(ierr);
22552c5f739Sprj-   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
22652c5f739Sprj-   ierr = MatDenseGetArrayRead(B,&barray);CHKERRQ(ierr);
22752c5f739Sprj-   /* loops are permuted compared to MatMatMultNumeric so that viewB is created only once per column of A */
22852c5f739Sprj-   for (j=0; j<nc; j++) {
22952c5f739Sprj-     ierr = ISGetSize(bA->isglobal.col[j],&M);CHKERRQ(ierr);
23052c5f739Sprj-     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB);CHKERRQ(ierr);
2316718818eSStefano Zampini     ierr = MatDenseSetLDA(viewB,ldb);CHKERRQ(ierr);
23252c5f739Sprj-     for (i=0; i<nr; i++) {
23352c5f739Sprj-       if (!bA->m[i][j]) continue;
23452c5f739Sprj-       /* MatMatMultSymbolic may attach a specific container (depending on MatType of bA->m[i][j]) to workC[i][j] */
2354222ddf1SHong Zhang 
2364222ddf1SHong Zhang       ierr = MatProductCreate(bA->m[i][j],viewB,NULL,&contents->workC[i*nc + j]);CHKERRQ(ierr);
2374222ddf1SHong Zhang       workC = contents->workC[i*nc + j];
2384222ddf1SHong Zhang       ierr = MatProductSetType(workC,MATPRODUCT_AB);CHKERRQ(ierr);
2394222ddf1SHong Zhang       ierr = MatProductSetAlgorithm(workC,"default");CHKERRQ(ierr);
2404222ddf1SHong Zhang       ierr = MatProductSetFill(workC,fill);CHKERRQ(ierr);
2414222ddf1SHong Zhang       ierr = MatProductSetFromOptions(workC);CHKERRQ(ierr);
2424222ddf1SHong Zhang       ierr = MatProductSymbolic(workC);CHKERRQ(ierr);
2434222ddf1SHong Zhang 
2446718818eSStefano Zampini       /* since tarray will be shared by all Mat */
2456718818eSStefano Zampini       ierr = MatSeqDenseSetPreallocation(workC,contents->tarray);CHKERRQ(ierr);
2466718818eSStefano Zampini       ierr = MatMPIDenseSetPreallocation(workC,contents->tarray);CHKERRQ(ierr);
24752c5f739Sprj-     }
24852c5f739Sprj-     ierr = MatDestroy(&viewB);CHKERRQ(ierr);
24952c5f739Sprj-   }
25052c5f739Sprj-   ierr = MatDenseRestoreArrayRead(B,&barray);CHKERRQ(ierr);
25152c5f739Sprj- 
2526718818eSStefano Zampini   C->ops->productnumeric = MatProductNumeric_Nest_Dense;
25352c5f739Sprj-   PetscFunctionReturn(0);
25452c5f739Sprj- }
25552c5f739Sprj- 
2564222ddf1SHong Zhang /* --------------------------------------------------------- */
2574222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_Nest_Dense_AB(Mat C)
2584222ddf1SHong Zhang {
2594222ddf1SHong Zhang   PetscFunctionBegin;
2606718818eSStefano Zampini   C->ops->productsymbolic = MatProductSymbolic_Nest_Dense;
2614222ddf1SHong Zhang   PetscFunctionReturn(0);
2624222ddf1SHong Zhang }
2634222ddf1SHong Zhang 
2644222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_Nest_Dense(Mat C)
26552c5f739Sprj- {
26652c5f739Sprj-   PetscErrorCode ierr;
2674222ddf1SHong Zhang   Mat_Product    *product = C->product;
26852c5f739Sprj- 
26952c5f739Sprj-   PetscFunctionBegin;
2704222ddf1SHong Zhang   if (product->type == MATPRODUCT_AB) {
2714222ddf1SHong Zhang     ierr = MatProductSetFromOptions_Nest_Dense_AB(C);CHKERRQ(ierr);
2726718818eSStefano Zampini   }
27352c5f739Sprj-   PetscFunctionReturn(0);
27452c5f739Sprj- }
2754222ddf1SHong Zhang /* --------------------------------------------------------- */
27652c5f739Sprj- 
277207556f9SJed Brown static PetscErrorCode MatMultTranspose_Nest(Mat A,Vec x,Vec y)
278d8588912SDave May {
279d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
280207556f9SJed Brown   Vec            *bx = bA->left,*by = bA->right;
281207556f9SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
282d8588912SDave May   PetscErrorCode ierr;
283d8588912SDave May 
284d8588912SDave May   PetscFunctionBegin;
285609e31cbSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
286609e31cbSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(y,bA->isglobal.col[i],&by[i]);CHKERRQ(ierr);}
287207556f9SJed Brown   for (j=0; j<nc; j++) {
288609e31cbSJed Brown     ierr = VecZeroEntries(by[j]);CHKERRQ(ierr);
289609e31cbSJed Brown     for (i=0; i<nr; i++) {
2906c75ac25SJed Brown       if (!bA->m[i][j]) continue;
291609e31cbSJed Brown       /* y[j] <- y[j] + (A[i][j])^T * x[i] */
292609e31cbSJed Brown       ierr = MatMultTransposeAdd(bA->m[i][j],bx[i],by[j],by[j]);CHKERRQ(ierr);
293d8588912SDave May     }
294d8588912SDave May   }
295609e31cbSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
296609e31cbSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(y,bA->isglobal.col[i],&by[i]);CHKERRQ(ierr);}
297d8588912SDave May   PetscFunctionReturn(0);
298d8588912SDave May }
299d8588912SDave May 
3009194d70fSJed Brown static PetscErrorCode MatMultTransposeAdd_Nest(Mat A,Vec x,Vec y,Vec z)
3019194d70fSJed Brown {
3029194d70fSJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
3039194d70fSJed Brown   Vec            *bx = bA->left,*bz = bA->right;
3049194d70fSJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
3059194d70fSJed Brown   PetscErrorCode ierr;
3069194d70fSJed Brown 
3079194d70fSJed Brown   PetscFunctionBegin;
3089194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
3099194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(z,bA->isglobal.col[i],&bz[i]);CHKERRQ(ierr);}
3109194d70fSJed Brown   for (j=0; j<nc; j++) {
3119194d70fSJed Brown     if (y != z) {
3129194d70fSJed Brown       Vec by;
3139194d70fSJed Brown       ierr = VecGetSubVector(y,bA->isglobal.col[j],&by);CHKERRQ(ierr);
3149194d70fSJed Brown       ierr = VecCopy(by,bz[j]);CHKERRQ(ierr);
3159194d70fSJed Brown       ierr = VecRestoreSubVector(y,bA->isglobal.col[j],&by);CHKERRQ(ierr);
3169194d70fSJed Brown     }
3179194d70fSJed Brown     for (i=0; i<nr; i++) {
3186c75ac25SJed Brown       if (!bA->m[i][j]) continue;
3199194d70fSJed Brown       /* z[j] <- y[j] + (A[i][j])^T * x[i] */
3209194d70fSJed Brown       ierr = MatMultTransposeAdd(bA->m[i][j],bx[i],bz[j],bz[j]);CHKERRQ(ierr);
3219194d70fSJed Brown     }
3229194d70fSJed Brown   }
3239194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
3249194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(z,bA->isglobal.col[i],&bz[i]);CHKERRQ(ierr);}
3259194d70fSJed Brown   PetscFunctionReturn(0);
3269194d70fSJed Brown }
3279194d70fSJed Brown 
328f8170845SAlex Fikl static PetscErrorCode MatTranspose_Nest(Mat A,MatReuse reuse,Mat *B)
329f8170845SAlex Fikl {
330f8170845SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data, *bC;
331f8170845SAlex Fikl   Mat            C;
332f8170845SAlex Fikl   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
333f8170845SAlex Fikl   PetscErrorCode ierr;
334f8170845SAlex Fikl 
335f8170845SAlex Fikl   PetscFunctionBegin;
336cf37664fSBarry Smith   if (reuse == MAT_INPLACE_MATRIX && nr != nc) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_SIZ,"Square nested matrix only for in-place");
337f8170845SAlex Fikl 
338cf37664fSBarry Smith   if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_INPLACE_MATRIX) {
339f8170845SAlex Fikl     Mat *subs;
340f8170845SAlex Fikl     IS  *is_row,*is_col;
341f8170845SAlex Fikl 
342f8170845SAlex Fikl     ierr = PetscCalloc1(nr * nc,&subs);CHKERRQ(ierr);
343f8170845SAlex Fikl     ierr = PetscMalloc2(nr,&is_row,nc,&is_col);CHKERRQ(ierr);
344f8170845SAlex Fikl     ierr = MatNestGetISs(A,is_row,is_col);CHKERRQ(ierr);
345cf37664fSBarry Smith     if (reuse == MAT_INPLACE_MATRIX) {
346ddeb9bd8SAlex Fikl       for (i=0; i<nr; i++) {
347ddeb9bd8SAlex Fikl         for (j=0; j<nc; j++) {
348ddeb9bd8SAlex Fikl           subs[i + nr * j] = bA->m[i][j];
349ddeb9bd8SAlex Fikl         }
350ddeb9bd8SAlex Fikl       }
351ddeb9bd8SAlex Fikl     }
352ddeb9bd8SAlex Fikl 
353f8170845SAlex Fikl     ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nc,is_col,nr,is_row,subs,&C);CHKERRQ(ierr);
354f8170845SAlex Fikl     ierr = PetscFree(subs);CHKERRQ(ierr);
3553d994f23SBarry Smith     ierr = PetscFree2(is_row,is_col);CHKERRQ(ierr);
356f8170845SAlex Fikl   } else {
357f8170845SAlex Fikl     C = *B;
358f8170845SAlex Fikl   }
359f8170845SAlex Fikl 
360f8170845SAlex Fikl   bC = (Mat_Nest*)C->data;
361f8170845SAlex Fikl   for (i=0; i<nr; i++) {
362f8170845SAlex Fikl     for (j=0; j<nc; j++) {
363f8170845SAlex Fikl       if (bA->m[i][j]) {
364f8170845SAlex Fikl         ierr = MatTranspose(bA->m[i][j], reuse, &(bC->m[j][i]));CHKERRQ(ierr);
365f8170845SAlex Fikl       } else {
366f8170845SAlex Fikl         bC->m[j][i] = NULL;
367f8170845SAlex Fikl       }
368f8170845SAlex Fikl     }
369f8170845SAlex Fikl   }
370f8170845SAlex Fikl 
371cf37664fSBarry Smith   if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) {
372f8170845SAlex Fikl     *B = C;
373f8170845SAlex Fikl   } else {
374f8170845SAlex Fikl     ierr = MatHeaderMerge(A, &C);CHKERRQ(ierr);
375f8170845SAlex Fikl   }
376f8170845SAlex Fikl   PetscFunctionReturn(0);
377f8170845SAlex Fikl }
378f8170845SAlex Fikl 
379e2d7f03fSJed Brown static PetscErrorCode MatNestDestroyISList(PetscInt n,IS **list)
380e2d7f03fSJed Brown {
381e2d7f03fSJed Brown   PetscErrorCode ierr;
382e2d7f03fSJed Brown   IS             *lst = *list;
383e2d7f03fSJed Brown   PetscInt       i;
384e2d7f03fSJed Brown 
385e2d7f03fSJed Brown   PetscFunctionBegin;
386e2d7f03fSJed Brown   if (!lst) PetscFunctionReturn(0);
3876bf464f9SBarry Smith   for (i=0; i<n; i++) if (lst[i]) {ierr = ISDestroy(&lst[i]);CHKERRQ(ierr);}
388e2d7f03fSJed Brown   ierr  = PetscFree(lst);CHKERRQ(ierr);
3890298fd71SBarry Smith   *list = NULL;
390e2d7f03fSJed Brown   PetscFunctionReturn(0);
391e2d7f03fSJed Brown }
392e2d7f03fSJed Brown 
39306a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat A)
394d8588912SDave May {
395d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
396d8588912SDave May   PetscInt       i,j;
397d8588912SDave May   PetscErrorCode ierr;
398d8588912SDave May 
399d8588912SDave May   PetscFunctionBegin;
400d8588912SDave May   /* release the matrices and the place holders */
401e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nr,&vs->isglobal.row);CHKERRQ(ierr);
402e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nc,&vs->isglobal.col);CHKERRQ(ierr);
403e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nr,&vs->islocal.row);CHKERRQ(ierr);
404e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nc,&vs->islocal.col);CHKERRQ(ierr);
405d8588912SDave May 
406d8588912SDave May   ierr = PetscFree(vs->row_len);CHKERRQ(ierr);
407d8588912SDave May   ierr = PetscFree(vs->col_len);CHKERRQ(ierr);
40806a1af2fSStefano Zampini   ierr = PetscFree(vs->nnzstate);CHKERRQ(ierr);
409d8588912SDave May 
410207556f9SJed Brown   ierr = PetscFree2(vs->left,vs->right);CHKERRQ(ierr);
411207556f9SJed Brown 
412d8588912SDave May   /* release the matrices and the place holders */
413d8588912SDave May   if (vs->m) {
414d8588912SDave May     for (i=0; i<vs->nr; i++) {
415d8588912SDave May       for (j=0; j<vs->nc; j++) {
4166bf464f9SBarry Smith         ierr = MatDestroy(&vs->m[i][j]);CHKERRQ(ierr);
417d8588912SDave May       }
418d8588912SDave May       ierr = PetscFree(vs->m[i]);CHKERRQ(ierr);
419d8588912SDave May     }
420d8588912SDave May     ierr = PetscFree(vs->m);CHKERRQ(ierr);
421d8588912SDave May   }
42206a1af2fSStefano Zampini 
42306a1af2fSStefano Zampini   /* restore defaults */
42406a1af2fSStefano Zampini   vs->nr = 0;
42506a1af2fSStefano Zampini   vs->nc = 0;
42606a1af2fSStefano Zampini   vs->splitassembly = PETSC_FALSE;
42706a1af2fSStefano Zampini   PetscFunctionReturn(0);
42806a1af2fSStefano Zampini }
42906a1af2fSStefano Zampini 
43006a1af2fSStefano Zampini static PetscErrorCode MatDestroy_Nest(Mat A)
43106a1af2fSStefano Zampini {
43206a1af2fSStefano Zampini   PetscErrorCode ierr;
43306a1af2fSStefano Zampini 
43406a1af2fSStefano Zampini   ierr = MatReset_Nest(A);CHKERRQ(ierr);
435bf0cc555SLisandro Dalcin   ierr = PetscFree(A->data);CHKERRQ(ierr);
436d8588912SDave May 
437*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",NULL);CHKERRQ(ierr);
438*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",NULL);CHKERRQ(ierr);
439*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",NULL);CHKERRQ(ierr);
440*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",NULL);CHKERRQ(ierr);
441*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",NULL);CHKERRQ(ierr);
442*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",NULL);CHKERRQ(ierr);
443*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",NULL);CHKERRQ(ierr);
444*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",NULL);CHKERRQ(ierr);
445*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",NULL);CHKERRQ(ierr);
446*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",NULL);CHKERRQ(ierr);
447*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",NULL);CHKERRQ(ierr);
448*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",NULL);CHKERRQ(ierr);
449*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpidense_C",NULL);CHKERRQ(ierr);
450*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqdense_C",NULL);CHKERRQ(ierr);
4514222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_seqdense_C",NULL);CHKERRQ(ierr);
4524222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_mpidense_C",NULL);CHKERRQ(ierr);
4534222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_dense_C",NULL);CHKERRQ(ierr);
454d8588912SDave May   PetscFunctionReturn(0);
455d8588912SDave May }
456d8588912SDave May 
457381b8e50SStefano Zampini static PetscErrorCode MatMissingDiagonal_Nest(Mat mat,PetscBool *missing,PetscInt *dd)
458381b8e50SStefano Zampini {
459381b8e50SStefano Zampini   Mat_Nest       *vs = (Mat_Nest*)mat->data;
460381b8e50SStefano Zampini   PetscInt       i;
461381b8e50SStefano Zampini   PetscErrorCode ierr;
462381b8e50SStefano Zampini 
463381b8e50SStefano Zampini   PetscFunctionBegin;
464381b8e50SStefano Zampini   if (dd) *dd = 0;
465381b8e50SStefano Zampini   if (!vs->nr) {
466381b8e50SStefano Zampini     *missing = PETSC_TRUE;
467381b8e50SStefano Zampini     PetscFunctionReturn(0);
468381b8e50SStefano Zampini   }
469381b8e50SStefano Zampini   *missing = PETSC_FALSE;
470381b8e50SStefano Zampini   for (i = 0; i < vs->nr && !(*missing); i++) {
471381b8e50SStefano Zampini     *missing = PETSC_TRUE;
472381b8e50SStefano Zampini     if (vs->m[i][i]) {
473381b8e50SStefano Zampini       ierr = MatMissingDiagonal(vs->m[i][i],missing,NULL);CHKERRQ(ierr);
474381b8e50SStefano Zampini       if (*missing && dd) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"First missing entry not yet implemented");
475381b8e50SStefano Zampini     }
476381b8e50SStefano Zampini   }
477381b8e50SStefano Zampini   PetscFunctionReturn(0);
478381b8e50SStefano Zampini }
479381b8e50SStefano Zampini 
480207556f9SJed Brown static PetscErrorCode MatAssemblyBegin_Nest(Mat A,MatAssemblyType type)
481d8588912SDave May {
482d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
483d8588912SDave May   PetscInt       i,j;
484d8588912SDave May   PetscErrorCode ierr;
48506a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
486d8588912SDave May 
487d8588912SDave May   PetscFunctionBegin;
488d8588912SDave May   for (i=0; i<vs->nr; i++) {
489d8588912SDave May     for (j=0; j<vs->nc; j++) {
49006a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
491e7c19651SJed Brown       if (vs->m[i][j]) {
492e7c19651SJed Brown         ierr = MatAssemblyBegin(vs->m[i][j],type);CHKERRQ(ierr);
493e7c19651SJed Brown         if (!vs->splitassembly) {
494e7c19651SJed Brown           /* Note: split assembly will fail if the same block appears more than once (even indirectly through a nested
495e7c19651SJed Brown            * sub-block). This could be fixed by adding a flag to Mat so that there was a way to check if a Mat was
496e7c19651SJed Brown            * already performing an assembly, but the result would by more complicated and appears to offer less
497e7c19651SJed Brown            * potential for diagnostics and correctness checking. Split assembly should be fixed once there is an
498e7c19651SJed Brown            * interface for libraries to make asynchronous progress in "user-defined non-blocking collectives".
499e7c19651SJed Brown            */
500e7c19651SJed Brown           ierr = MatAssemblyEnd(vs->m[i][j],type);CHKERRQ(ierr);
50106a1af2fSStefano Zampini           ierr = MatGetNonzeroState(vs->m[i][j],&subnnzstate);CHKERRQ(ierr);
502e7c19651SJed Brown         }
503e7c19651SJed Brown       }
50406a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || vs->nnzstate[i*vs->nc+j] != subnnzstate);
50506a1af2fSStefano Zampini       vs->nnzstate[i*vs->nc+j] = subnnzstate;
506d8588912SDave May     }
507d8588912SDave May   }
50806a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
509d8588912SDave May   PetscFunctionReturn(0);
510d8588912SDave May }
511d8588912SDave May 
512207556f9SJed Brown static PetscErrorCode MatAssemblyEnd_Nest(Mat A, MatAssemblyType type)
513d8588912SDave May {
514d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
515d8588912SDave May   PetscInt       i,j;
516d8588912SDave May   PetscErrorCode ierr;
517d8588912SDave May 
518d8588912SDave May   PetscFunctionBegin;
519d8588912SDave May   for (i=0; i<vs->nr; i++) {
520d8588912SDave May     for (j=0; j<vs->nc; j++) {
521e7c19651SJed Brown       if (vs->m[i][j]) {
522e7c19651SJed Brown         if (vs->splitassembly) {
523e7c19651SJed Brown           ierr = MatAssemblyEnd(vs->m[i][j],type);CHKERRQ(ierr);
524e7c19651SJed Brown         }
525e7c19651SJed Brown       }
526d8588912SDave May     }
527d8588912SDave May   }
528d8588912SDave May   PetscFunctionReturn(0);
529d8588912SDave May }
530d8588912SDave May 
531f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatRow(Mat A,PetscInt row,Mat *B)
532d8588912SDave May {
533207556f9SJed Brown   PetscErrorCode ierr;
534f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
535f349c1fdSJed Brown   PetscInt       j;
536f349c1fdSJed Brown   Mat            sub;
537d8588912SDave May 
538d8588912SDave May   PetscFunctionBegin;
5390298fd71SBarry Smith   sub = (row < vs->nc) ? vs->m[row][row] : (Mat)NULL; /* Prefer to find on the diagonal */
540f349c1fdSJed Brown   for (j=0; !sub && j<vs->nc; j++) sub = vs->m[row][j];
5414994cf47SJed Brown   if (sub) {ierr = MatSetUp(sub);CHKERRQ(ierr);}       /* Ensure that the sizes are available */
542f349c1fdSJed Brown   *B = sub;
543f349c1fdSJed Brown   PetscFunctionReturn(0);
544d8588912SDave May }
545d8588912SDave May 
546f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatCol(Mat A,PetscInt col,Mat *B)
547f349c1fdSJed Brown {
548207556f9SJed Brown   PetscErrorCode ierr;
549f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
550f349c1fdSJed Brown   PetscInt       i;
551f349c1fdSJed Brown   Mat            sub;
552f349c1fdSJed Brown 
553f349c1fdSJed Brown   PetscFunctionBegin;
5540298fd71SBarry Smith   sub = (col < vs->nr) ? vs->m[col][col] : (Mat)NULL; /* Prefer to find on the diagonal */
555f349c1fdSJed Brown   for (i=0; !sub && i<vs->nr; i++) sub = vs->m[i][col];
5564994cf47SJed Brown   if (sub) {ierr = MatSetUp(sub);CHKERRQ(ierr);}       /* Ensure that the sizes are available */
557f349c1fdSJed Brown   *B = sub;
558f349c1fdSJed Brown   PetscFunctionReturn(0);
559d8588912SDave May }
560d8588912SDave May 
56118d228c0SPierre Jolivet static PetscErrorCode MatNestFindISRange(Mat A,PetscInt n,const IS list[],IS is,PetscInt *begin,PetscInt *end)
562f349c1fdSJed Brown {
56318d228c0SPierre Jolivet   PetscInt       i,j,size,m;
564f349c1fdSJed Brown   PetscBool      flg;
56518d228c0SPierre Jolivet   IS             out,concatenate[2];
56618d228c0SPierre Jolivet   PetscErrorCode ierr;
567f349c1fdSJed Brown 
568f349c1fdSJed Brown   PetscFunctionBegin;
569f349c1fdSJed Brown   PetscValidPointer(list,3);
570f349c1fdSJed Brown   PetscValidHeaderSpecific(is,IS_CLASSID,4);
57118d228c0SPierre Jolivet   if (begin) {
57218d228c0SPierre Jolivet     PetscValidIntPointer(begin,5);
57318d228c0SPierre Jolivet     *begin = -1;
57418d228c0SPierre Jolivet   }
57518d228c0SPierre Jolivet   if (end) {
57618d228c0SPierre Jolivet     PetscValidIntPointer(end,6);
57718d228c0SPierre Jolivet     *end = -1;
57818d228c0SPierre Jolivet   }
579f349c1fdSJed Brown   for (i=0; i<n; i++) {
580207556f9SJed Brown     if (!list[i]) continue;
581320466b0SStefano Zampini     ierr = ISEqualUnsorted(list[i],is,&flg);CHKERRQ(ierr);
582f349c1fdSJed Brown     if (flg) {
58318d228c0SPierre Jolivet       if (begin) *begin = i;
58418d228c0SPierre Jolivet       if (end) *end = i+1;
585f349c1fdSJed Brown       PetscFunctionReturn(0);
586f349c1fdSJed Brown     }
587f349c1fdSJed Brown   }
58818d228c0SPierre Jolivet   ierr = ISGetSize(is,&size);CHKERRQ(ierr);
58918d228c0SPierre Jolivet   for (i=0; i<n-1; i++) {
59018d228c0SPierre Jolivet     if (!list[i]) continue;
59118d228c0SPierre Jolivet     m = 0;
59218d228c0SPierre Jolivet     ierr = ISConcatenate(PetscObjectComm((PetscObject)A),2,list+i,&out);CHKERRQ(ierr);
59318d228c0SPierre Jolivet     ierr = ISGetSize(out,&m);CHKERRQ(ierr);
59418d228c0SPierre Jolivet     for (j=i+2; j<n && m<size; j++) {
59518d228c0SPierre Jolivet       if (list[j]) {
59618d228c0SPierre Jolivet         concatenate[0] = out;
59718d228c0SPierre Jolivet         concatenate[1] = list[j];
59818d228c0SPierre Jolivet         ierr = ISConcatenate(PetscObjectComm((PetscObject)A),2,concatenate,&out);CHKERRQ(ierr);
59918d228c0SPierre Jolivet         ierr = ISDestroy(concatenate);CHKERRQ(ierr);
60018d228c0SPierre Jolivet         ierr = ISGetSize(out,&m);CHKERRQ(ierr);
60118d228c0SPierre Jolivet       }
60218d228c0SPierre Jolivet     }
60318d228c0SPierre Jolivet     if (m == size) {
60418d228c0SPierre Jolivet       ierr = ISEqualUnsorted(out,is,&flg);CHKERRQ(ierr);
60518d228c0SPierre Jolivet       if (flg) {
60618d228c0SPierre Jolivet         if (begin) *begin = i;
60718d228c0SPierre Jolivet         if (end) *end = j;
60818d228c0SPierre Jolivet         ierr = ISDestroy(&out);CHKERRQ(ierr);
60918d228c0SPierre Jolivet         PetscFunctionReturn(0);
61018d228c0SPierre Jolivet       }
61118d228c0SPierre Jolivet     }
61218d228c0SPierre Jolivet     ierr = ISDestroy(&out);CHKERRQ(ierr);
61318d228c0SPierre Jolivet   }
61418d228c0SPierre Jolivet   PetscFunctionReturn(0);
615f349c1fdSJed Brown }
616f349c1fdSJed Brown 
61718d228c0SPierre Jolivet 
61818d228c0SPierre Jolivet static PetscErrorCode MatNestFillEmptyMat_Private(Mat A,PetscInt i,PetscInt j,Mat *B)
6198188e55aSJed Brown {
6208188e55aSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
62118d228c0SPierre Jolivet   PetscInt       lr,lc;
62218d228c0SPierre Jolivet   PetscErrorCode ierr;
62318d228c0SPierre Jolivet 
62418d228c0SPierre Jolivet   PetscFunctionBegin;
62518d228c0SPierre Jolivet   ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr);
62618d228c0SPierre Jolivet   ierr = ISGetLocalSize(vs->isglobal.row[i],&lr);CHKERRQ(ierr);
62718d228c0SPierre Jolivet   ierr = ISGetLocalSize(vs->isglobal.col[j],&lc);CHKERRQ(ierr);
62818d228c0SPierre Jolivet   ierr = MatSetSizes(*B,lr,lc,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr);
62918d228c0SPierre Jolivet   ierr = MatSetType(*B,MATAIJ);CHKERRQ(ierr);
63018d228c0SPierre Jolivet   ierr = MatSeqAIJSetPreallocation(*B,0,NULL);CHKERRQ(ierr);
63118d228c0SPierre Jolivet   ierr = MatMPIAIJSetPreallocation(*B,0,NULL,0,NULL);CHKERRQ(ierr);
63218d228c0SPierre Jolivet   ierr = MatSetUp(*B);CHKERRQ(ierr);
63318d228c0SPierre Jolivet   ierr = MatSetOption(*B,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
63418d228c0SPierre Jolivet   ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
63518d228c0SPierre Jolivet   ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
63618d228c0SPierre Jolivet   PetscFunctionReturn(0);
63718d228c0SPierre Jolivet }
63818d228c0SPierre Jolivet 
63918d228c0SPierre Jolivet static PetscErrorCode MatNestGetBlock_Private(Mat A,PetscInt rbegin,PetscInt rend,PetscInt cbegin,PetscInt cend,Mat *B)
64018d228c0SPierre Jolivet {
64118d228c0SPierre Jolivet   Mat_Nest       *vs = (Mat_Nest*)A->data;
64218d228c0SPierre Jolivet   Mat            *a;
64318d228c0SPierre Jolivet   PetscInt       i,j,k,l,nr=rend-rbegin,nc=cend-cbegin;
6448188e55aSJed Brown   char           keyname[256];
64518d228c0SPierre Jolivet   PetscBool      *b;
64618d228c0SPierre Jolivet   PetscBool      flg;
6478188e55aSJed Brown   PetscErrorCode ierr;
6488188e55aSJed Brown 
6498188e55aSJed Brown   PetscFunctionBegin;
6500298fd71SBarry Smith   *B   = NULL;
65118d228c0SPierre Jolivet   ierr = PetscSNPrintf(keyname,sizeof(keyname),"NestBlock_%D-%Dx%D-%D",rbegin,rend,cbegin,cend);CHKERRQ(ierr);
6528188e55aSJed Brown   ierr = PetscObjectQuery((PetscObject)A,keyname,(PetscObject*)B);CHKERRQ(ierr);
6538188e55aSJed Brown   if (*B) PetscFunctionReturn(0);
6548188e55aSJed Brown 
65518d228c0SPierre Jolivet   ierr = PetscMalloc2(nr*nc,&a,nr*nc,&b);CHKERRQ(ierr);
65618d228c0SPierre Jolivet   for (i=0; i<nr; i++) {
65718d228c0SPierre Jolivet     for (j=0; j<nc; j++) {
65818d228c0SPierre Jolivet       a[i*nc + j] = vs->m[rbegin+i][cbegin+j];
65918d228c0SPierre Jolivet       b[i*nc + j] = PETSC_FALSE;
66018d228c0SPierre Jolivet     }
66118d228c0SPierre Jolivet   }
66218d228c0SPierre Jolivet   if (nc!=vs->nc&&nr!=vs->nr) {
66318d228c0SPierre Jolivet     for (i=0; i<nr; i++) {
66418d228c0SPierre Jolivet       for (j=0; j<nc; j++) {
66518d228c0SPierre Jolivet         flg = PETSC_FALSE;
66618d228c0SPierre Jolivet         for (k=0; (k<nr&&!flg); k++) {
66718d228c0SPierre Jolivet           if (a[j + k*nc]) flg = PETSC_TRUE;
66818d228c0SPierre Jolivet         }
66918d228c0SPierre Jolivet         if (flg) {
67018d228c0SPierre Jolivet           flg = PETSC_FALSE;
67118d228c0SPierre Jolivet           for (l=0; (l<nc&&!flg); l++) {
67218d228c0SPierre Jolivet             if (a[i*nc + l]) flg = PETSC_TRUE;
67318d228c0SPierre Jolivet           }
67418d228c0SPierre Jolivet         }
67518d228c0SPierre Jolivet         if (!flg) {
67618d228c0SPierre Jolivet           b[i*nc + j] = PETSC_TRUE;
67718d228c0SPierre Jolivet           ierr = MatNestFillEmptyMat_Private(A,rbegin+i,cbegin+j,a + i*nc + j);CHKERRQ(ierr);
67818d228c0SPierre Jolivet         }
67918d228c0SPierre Jolivet       }
68018d228c0SPierre Jolivet     }
68118d228c0SPierre Jolivet   }
68218d228c0SPierre Jolivet   ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nr,nr!=vs->nr?NULL:vs->isglobal.row,nc,nc!=vs->nc?NULL:vs->isglobal.col,a,B);CHKERRQ(ierr);
68318d228c0SPierre Jolivet   for (i=0; i<nr; i++) {
68418d228c0SPierre Jolivet     for (j=0; j<nc; j++) {
68518d228c0SPierre Jolivet       if (b[i*nc + j]) {
68618d228c0SPierre Jolivet         ierr = MatDestroy(a + i*nc + j);CHKERRQ(ierr);
68718d228c0SPierre Jolivet       }
68818d228c0SPierre Jolivet     }
68918d228c0SPierre Jolivet   }
69018d228c0SPierre Jolivet   ierr = PetscFree2(a,b);CHKERRQ(ierr);
6918188e55aSJed Brown   (*B)->assembled = A->assembled;
6928188e55aSJed Brown   ierr = PetscObjectCompose((PetscObject)A,keyname,(PetscObject)*B);CHKERRQ(ierr);
6938188e55aSJed Brown   ierr = PetscObjectDereference((PetscObject)*B);CHKERRQ(ierr); /* Leave the only remaining reference in the composition */
6948188e55aSJed Brown   PetscFunctionReturn(0);
6958188e55aSJed Brown }
6968188e55aSJed Brown 
697f349c1fdSJed Brown static PetscErrorCode MatNestFindSubMat(Mat A,struct MatNestISPair *is,IS isrow,IS iscol,Mat *B)
698f349c1fdSJed Brown {
699f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
70018d228c0SPierre Jolivet   PetscInt       rbegin,rend,cbegin,cend;
7018188e55aSJed Brown   PetscErrorCode ierr;
702f349c1fdSJed Brown 
703f349c1fdSJed Brown   PetscFunctionBegin;
70418d228c0SPierre Jolivet   ierr = MatNestFindISRange(A,vs->nr,is->row,isrow,&rbegin,&rend);CHKERRQ(ierr);
70518d228c0SPierre Jolivet   ierr = MatNestFindISRange(A,vs->nc,is->col,iscol,&cbegin,&cend);CHKERRQ(ierr);
70618d228c0SPierre Jolivet   if (rend == rbegin + 1 && cend == cbegin + 1) {
70718d228c0SPierre Jolivet     if (!vs->m[rbegin][cbegin]) {
70818d228c0SPierre Jolivet       ierr = MatNestFillEmptyMat_Private(A,rbegin,cbegin,vs->m[rbegin] + cbegin);CHKERRQ(ierr);
70977019fcaSJed Brown     }
71018d228c0SPierre Jolivet     *B = vs->m[rbegin][cbegin];
71118d228c0SPierre Jolivet   } else if (rbegin != -1 && cbegin != -1) {
71218d228c0SPierre Jolivet     ierr = MatNestGetBlock_Private(A,rbegin,rend,cbegin,cend,B);CHKERRQ(ierr);
71318d228c0SPierre Jolivet   } else SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Could not find index set");
714f349c1fdSJed Brown   PetscFunctionReturn(0);
715f349c1fdSJed Brown }
716f349c1fdSJed Brown 
/*
   TODO: This does not actually return a submatrix we can modify
*/
7207dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrix_Nest(Mat A,IS isrow,IS iscol,MatReuse reuse,Mat *B)
721f349c1fdSJed Brown {
722f349c1fdSJed Brown   PetscErrorCode ierr;
723f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
724f349c1fdSJed Brown   Mat            sub;
725f349c1fdSJed Brown 
726f349c1fdSJed Brown   PetscFunctionBegin;
727f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->isglobal,isrow,iscol,&sub);CHKERRQ(ierr);
728f349c1fdSJed Brown   switch (reuse) {
729f349c1fdSJed Brown   case MAT_INITIAL_MATRIX:
7307874fa86SDave May     if (sub) { ierr = PetscObjectReference((PetscObject)sub);CHKERRQ(ierr); }
731f349c1fdSJed Brown     *B = sub;
732f349c1fdSJed Brown     break;
733f349c1fdSJed Brown   case MAT_REUSE_MATRIX:
734ce94432eSBarry Smith     if (sub != *B) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Submatrix was not used before in this call");
735f349c1fdSJed Brown     break;
736f349c1fdSJed Brown   case MAT_IGNORE_MATRIX:       /* Nothing to do */
737f349c1fdSJed Brown     break;
738511c6705SHong Zhang   case MAT_INPLACE_MATRIX:       /* Nothing to do */
739511c6705SHong Zhang     SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MAT_INPLACE_MATRIX is not supported yet");
740f349c1fdSJed Brown   }
741f349c1fdSJed Brown   PetscFunctionReturn(0);
742f349c1fdSJed Brown }
743f349c1fdSJed Brown 
744f349c1fdSJed Brown PetscErrorCode MatGetLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B)
745f349c1fdSJed Brown {
746f349c1fdSJed Brown   PetscErrorCode ierr;
747f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
748f349c1fdSJed Brown   Mat            sub;
749f349c1fdSJed Brown 
750f349c1fdSJed Brown   PetscFunctionBegin;
751f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub);CHKERRQ(ierr);
752f349c1fdSJed Brown   /* We allow the submatrix to be NULL, perhaps it would be better for the user to return an empty matrix instead */
753f349c1fdSJed Brown   if (sub) {ierr = PetscObjectReference((PetscObject)sub);CHKERRQ(ierr);}
754f349c1fdSJed Brown   *B = sub;
755d8588912SDave May   PetscFunctionReturn(0);
756d8588912SDave May }
757d8588912SDave May 
758207556f9SJed Brown static PetscErrorCode MatRestoreLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B)
759d8588912SDave May {
760d8588912SDave May   PetscErrorCode ierr;
761f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
762f349c1fdSJed Brown   Mat            sub;
763d8588912SDave May 
764d8588912SDave May   PetscFunctionBegin;
765f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub);CHKERRQ(ierr);
766ce94432eSBarry Smith   if (*B != sub) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has not been gotten");
767f349c1fdSJed Brown   if (sub) {
768ce94432eSBarry Smith     if (((PetscObject)sub)->refct <= 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has had reference count decremented too many times");
7696bf464f9SBarry Smith     ierr = MatDestroy(B);CHKERRQ(ierr);
770d8588912SDave May   }
771d8588912SDave May   PetscFunctionReturn(0);
772d8588912SDave May }
773d8588912SDave May 
7747874fa86SDave May static PetscErrorCode MatGetDiagonal_Nest(Mat A,Vec v)
7757874fa86SDave May {
7767874fa86SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
7777874fa86SDave May   PetscInt       i;
7787874fa86SDave May   PetscErrorCode ierr;
7797874fa86SDave May 
7807874fa86SDave May   PetscFunctionBegin;
7817874fa86SDave May   for (i=0; i<bA->nr; i++) {
782429bac76SJed Brown     Vec bv;
783429bac76SJed Brown     ierr = VecGetSubVector(v,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
7847874fa86SDave May     if (bA->m[i][i]) {
785429bac76SJed Brown       ierr = MatGetDiagonal(bA->m[i][i],bv);CHKERRQ(ierr);
7867874fa86SDave May     } else {
7875159a857SMatthew G. Knepley       ierr = VecSet(bv,0.0);CHKERRQ(ierr);
7887874fa86SDave May     }
789429bac76SJed Brown     ierr = VecRestoreSubVector(v,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
7907874fa86SDave May   }
7917874fa86SDave May   PetscFunctionReturn(0);
7927874fa86SDave May }
7937874fa86SDave May 
7947874fa86SDave May static PetscErrorCode MatDiagonalScale_Nest(Mat A,Vec l,Vec r)
7957874fa86SDave May {
7967874fa86SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
797429bac76SJed Brown   Vec            bl,*br;
7987874fa86SDave May   PetscInt       i,j;
7997874fa86SDave May   PetscErrorCode ierr;
8007874fa86SDave May 
8017874fa86SDave May   PetscFunctionBegin;
8023f800ebeSJed Brown   ierr = PetscCalloc1(bA->nc,&br);CHKERRQ(ierr);
8032e6472ebSElliott Sales de Andrade   if (r) {
804429bac76SJed Brown     for (j=0; j<bA->nc; j++) {ierr = VecGetSubVector(r,bA->isglobal.col[j],&br[j]);CHKERRQ(ierr);}
8052e6472ebSElliott Sales de Andrade   }
8062e6472ebSElliott Sales de Andrade   bl = NULL;
8077874fa86SDave May   for (i=0; i<bA->nr; i++) {
8082e6472ebSElliott Sales de Andrade     if (l) {
809429bac76SJed Brown       ierr = VecGetSubVector(l,bA->isglobal.row[i],&bl);CHKERRQ(ierr);
8102e6472ebSElliott Sales de Andrade     }
8117874fa86SDave May     for (j=0; j<bA->nc; j++) {
8127874fa86SDave May       if (bA->m[i][j]) {
813429bac76SJed Brown         ierr = MatDiagonalScale(bA->m[i][j],bl,br[j]);CHKERRQ(ierr);
8147874fa86SDave May       }
8157874fa86SDave May     }
8162e6472ebSElliott Sales de Andrade     if (l) {
817a061e289SJed Brown       ierr = VecRestoreSubVector(l,bA->isglobal.row[i],&bl);CHKERRQ(ierr);
8187874fa86SDave May     }
8192e6472ebSElliott Sales de Andrade   }
8202e6472ebSElliott Sales de Andrade   if (r) {
821429bac76SJed Brown     for (j=0; j<bA->nc; j++) {ierr = VecRestoreSubVector(r,bA->isglobal.col[j],&br[j]);CHKERRQ(ierr);}
8222e6472ebSElliott Sales de Andrade   }
823429bac76SJed Brown   ierr = PetscFree(br);CHKERRQ(ierr);
8247874fa86SDave May   PetscFunctionReturn(0);
8257874fa86SDave May }
8267874fa86SDave May 
827a061e289SJed Brown static PetscErrorCode MatScale_Nest(Mat A,PetscScalar a)
828a061e289SJed Brown {
829a061e289SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
830a061e289SJed Brown   PetscInt       i,j;
831a061e289SJed Brown   PetscErrorCode ierr;
832a061e289SJed Brown 
833a061e289SJed Brown   PetscFunctionBegin;
834a061e289SJed Brown   for (i=0; i<bA->nr; i++) {
835a061e289SJed Brown     for (j=0; j<bA->nc; j++) {
836a061e289SJed Brown       if (bA->m[i][j]) {
837a061e289SJed Brown         ierr = MatScale(bA->m[i][j],a);CHKERRQ(ierr);
838a061e289SJed Brown       }
839a061e289SJed Brown     }
840a061e289SJed Brown   }
841a061e289SJed Brown   PetscFunctionReturn(0);
842a061e289SJed Brown }
843a061e289SJed Brown 
844a061e289SJed Brown static PetscErrorCode MatShift_Nest(Mat A,PetscScalar a)
845a061e289SJed Brown {
846a061e289SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
847a061e289SJed Brown   PetscInt       i;
848a061e289SJed Brown   PetscErrorCode ierr;
84906a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
850a061e289SJed Brown 
851a061e289SJed Brown   PetscFunctionBegin;
852a061e289SJed Brown   for (i=0; i<bA->nr; i++) {
85306a1af2fSStefano Zampini     PetscObjectState subnnzstate = 0;
854ce94432eSBarry Smith     if (!bA->m[i][i]) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"No support for shifting an empty diagonal block, insert a matrix in block (%D,%D)",i,i);
855a061e289SJed Brown     ierr = MatShift(bA->m[i][i],a);CHKERRQ(ierr);
85606a1af2fSStefano Zampini     ierr = MatGetNonzeroState(bA->m[i][i],&subnnzstate);CHKERRQ(ierr);
85706a1af2fSStefano Zampini     nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i*bA->nc+i] != subnnzstate);
85806a1af2fSStefano Zampini     bA->nnzstate[i*bA->nc+i] = subnnzstate;
859a061e289SJed Brown   }
86006a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
861a061e289SJed Brown   PetscFunctionReturn(0);
862a061e289SJed Brown }
863a061e289SJed Brown 
86413135bc6SAlex Fikl static PetscErrorCode MatDiagonalSet_Nest(Mat A,Vec D,InsertMode is)
86513135bc6SAlex Fikl {
86613135bc6SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data;
86713135bc6SAlex Fikl   PetscInt       i;
86813135bc6SAlex Fikl   PetscErrorCode ierr;
86906a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
87013135bc6SAlex Fikl 
87113135bc6SAlex Fikl   PetscFunctionBegin;
87213135bc6SAlex Fikl   for (i=0; i<bA->nr; i++) {
87306a1af2fSStefano Zampini     PetscObjectState subnnzstate = 0;
87413135bc6SAlex Fikl     Vec              bv;
87513135bc6SAlex Fikl     ierr = VecGetSubVector(D,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
87613135bc6SAlex Fikl     if (bA->m[i][i]) {
87713135bc6SAlex Fikl       ierr = MatDiagonalSet(bA->m[i][i],bv,is);CHKERRQ(ierr);
87806a1af2fSStefano Zampini       ierr = MatGetNonzeroState(bA->m[i][i],&subnnzstate);CHKERRQ(ierr);
87913135bc6SAlex Fikl     }
88013135bc6SAlex Fikl     ierr = VecRestoreSubVector(D,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
88106a1af2fSStefano Zampini     nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i*bA->nc+i] != subnnzstate);
88206a1af2fSStefano Zampini     bA->nnzstate[i*bA->nc+i] = subnnzstate;
88313135bc6SAlex Fikl   }
88406a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
88513135bc6SAlex Fikl   PetscFunctionReturn(0);
88613135bc6SAlex Fikl }
88713135bc6SAlex Fikl 
888f8170845SAlex Fikl static PetscErrorCode MatSetRandom_Nest(Mat A,PetscRandom rctx)
889f8170845SAlex Fikl {
890f8170845SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data;
891f8170845SAlex Fikl   PetscInt       i,j;
892f8170845SAlex Fikl   PetscErrorCode ierr;
893f8170845SAlex Fikl 
894f8170845SAlex Fikl   PetscFunctionBegin;
895f8170845SAlex Fikl   for (i=0; i<bA->nr; i++) {
896f8170845SAlex Fikl     for (j=0; j<bA->nc; j++) {
897f8170845SAlex Fikl       if (bA->m[i][j]) {
898f8170845SAlex Fikl         ierr = MatSetRandom(bA->m[i][j],rctx);CHKERRQ(ierr);
899f8170845SAlex Fikl       }
900f8170845SAlex Fikl     }
901f8170845SAlex Fikl   }
902f8170845SAlex Fikl   PetscFunctionReturn(0);
903f8170845SAlex Fikl }
904f8170845SAlex Fikl 
9052a7a6963SBarry Smith static PetscErrorCode MatCreateVecs_Nest(Mat A,Vec *right,Vec *left)
906d8588912SDave May {
907d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
908d8588912SDave May   Vec            *L,*R;
909d8588912SDave May   MPI_Comm       comm;
910d8588912SDave May   PetscInt       i,j;
911d8588912SDave May   PetscErrorCode ierr;
912d8588912SDave May 
913d8588912SDave May   PetscFunctionBegin;
914ce94432eSBarry Smith   ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr);
915d8588912SDave May   if (right) {
916d8588912SDave May     /* allocate R */
917854ce69bSBarry Smith     ierr = PetscMalloc1(bA->nc, &R);CHKERRQ(ierr);
918d8588912SDave May     /* Create the right vectors */
919d8588912SDave May     for (j=0; j<bA->nc; j++) {
920d8588912SDave May       for (i=0; i<bA->nr; i++) {
921d8588912SDave May         if (bA->m[i][j]) {
9222a7a6963SBarry Smith           ierr = MatCreateVecs(bA->m[i][j],&R[j],NULL);CHKERRQ(ierr);
923d8588912SDave May           break;
924d8588912SDave May         }
925d8588912SDave May       }
9266c4ed002SBarry Smith       if (i==bA->nr) SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null column.");
927d8588912SDave May     }
928f349c1fdSJed Brown     ierr = VecCreateNest(comm,bA->nc,bA->isglobal.col,R,right);CHKERRQ(ierr);
929d8588912SDave May     /* hand back control to the nest vector */
930d8588912SDave May     for (j=0; j<bA->nc; j++) {
9316bf464f9SBarry Smith       ierr = VecDestroy(&R[j]);CHKERRQ(ierr);
932d8588912SDave May     }
933d8588912SDave May     ierr = PetscFree(R);CHKERRQ(ierr);
934d8588912SDave May   }
935d8588912SDave May 
936d8588912SDave May   if (left) {
937d8588912SDave May     /* allocate L */
938854ce69bSBarry Smith     ierr = PetscMalloc1(bA->nr, &L);CHKERRQ(ierr);
939d8588912SDave May     /* Create the left vectors */
940d8588912SDave May     for (i=0; i<bA->nr; i++) {
941d8588912SDave May       for (j=0; j<bA->nc; j++) {
942d8588912SDave May         if (bA->m[i][j]) {
9432a7a6963SBarry Smith           ierr = MatCreateVecs(bA->m[i][j],NULL,&L[i]);CHKERRQ(ierr);
944d8588912SDave May           break;
945d8588912SDave May         }
946d8588912SDave May       }
9476c4ed002SBarry Smith       if (j==bA->nc) SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null row.");
948d8588912SDave May     }
949d8588912SDave May 
950f349c1fdSJed Brown     ierr = VecCreateNest(comm,bA->nr,bA->isglobal.row,L,left);CHKERRQ(ierr);
951d8588912SDave May     for (i=0; i<bA->nr; i++) {
9526bf464f9SBarry Smith       ierr = VecDestroy(&L[i]);CHKERRQ(ierr);
953d8588912SDave May     }
954d8588912SDave May 
955d8588912SDave May     ierr = PetscFree(L);CHKERRQ(ierr);
956d8588912SDave May   }
957d8588912SDave May   PetscFunctionReturn(0);
958d8588912SDave May }
959d8588912SDave May 
960207556f9SJed Brown static PetscErrorCode MatView_Nest(Mat A,PetscViewer viewer)
961d8588912SDave May {
962d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
96329e60adbSStefano Zampini   PetscBool      isascii,viewSub = PETSC_FALSE;
964d8588912SDave May   PetscInt       i,j;
965d8588912SDave May   PetscErrorCode ierr;
966d8588912SDave May 
967d8588912SDave May   PetscFunctionBegin;
968251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
969d8588912SDave May   if (isascii) {
970d8588912SDave May 
97129e60adbSStefano Zampini     ierr = PetscOptionsGetBool(((PetscObject)A)->options,((PetscObject)A)->prefix,"-mat_view_nest_sub",&viewSub,NULL);CHKERRQ(ierr);
972d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"Matrix object: \n");CHKERRQ(ierr);
973d86155a6SBarry Smith     ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);
974d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer, "type=nest, rows=%D, cols=%D \n",bA->nr,bA->nc);CHKERRQ(ierr);
975d8588912SDave May 
976d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"MatNest structure: \n");CHKERRQ(ierr);
977d8588912SDave May     for (i=0; i<bA->nr; i++) {
978d8588912SDave May       for (j=0; j<bA->nc; j++) {
97919fd82e9SBarry Smith         MatType   type;
980270f95d7SJed Brown         char      name[256] = "",prefix[256] = "";
981d8588912SDave May         PetscInt  NR,NC;
982d8588912SDave May         PetscBool isNest = PETSC_FALSE;
983d8588912SDave May 
984d8588912SDave May         if (!bA->m[i][j]) {
98585019af4SBarry Smith           ierr = PetscViewerASCIIPrintf(viewer, "(%D,%D) : NULL \n",i,j);CHKERRQ(ierr);
986d8588912SDave May           continue;
987d8588912SDave May         }
988d8588912SDave May         ierr = MatGetSize(bA->m[i][j],&NR,&NC);CHKERRQ(ierr);
989d8588912SDave May         ierr = MatGetType(bA->m[i][j], &type);CHKERRQ(ierr);
9908caf3d72SBarry Smith         if (((PetscObject)bA->m[i][j])->name) {ierr = PetscSNPrintf(name,sizeof(name),"name=\"%s\", ",((PetscObject)bA->m[i][j])->name);CHKERRQ(ierr);}
9918caf3d72SBarry Smith         if (((PetscObject)bA->m[i][j])->prefix) {ierr = PetscSNPrintf(prefix,sizeof(prefix),"prefix=\"%s\", ",((PetscObject)bA->m[i][j])->prefix);CHKERRQ(ierr);}
992251f4c67SDmitry Karpeev         ierr = PetscObjectTypeCompare((PetscObject)bA->m[i][j],MATNEST,&isNest);CHKERRQ(ierr);
993d8588912SDave May 
994270f95d7SJed Brown         ierr = PetscViewerASCIIPrintf(viewer,"(%D,%D) : %s%stype=%s, rows=%D, cols=%D \n",i,j,name,prefix,type,NR,NC);CHKERRQ(ierr);
995d8588912SDave May 
99629e60adbSStefano Zampini         if (isNest || viewSub) {
997270f95d7SJed Brown           ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);  /* push1 */
998d8588912SDave May           ierr = MatView(bA->m[i][j],viewer);CHKERRQ(ierr);
999270f95d7SJed Brown           ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);    /* pop1 */
1000d8588912SDave May         }
1001d8588912SDave May       }
1002d8588912SDave May     }
1003d86155a6SBarry Smith     ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);    /* pop0 */
1004d8588912SDave May   }
1005d8588912SDave May   PetscFunctionReturn(0);
1006d8588912SDave May }
1007d8588912SDave May 
1008207556f9SJed Brown static PetscErrorCode MatZeroEntries_Nest(Mat A)
1009d8588912SDave May {
1010d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
1011d8588912SDave May   PetscInt       i,j;
1012d8588912SDave May   PetscErrorCode ierr;
1013d8588912SDave May 
1014d8588912SDave May   PetscFunctionBegin;
1015d8588912SDave May   for (i=0; i<bA->nr; i++) {
1016d8588912SDave May     for (j=0; j<bA->nc; j++) {
1017d8588912SDave May       if (!bA->m[i][j]) continue;
1018d8588912SDave May       ierr = MatZeroEntries(bA->m[i][j]);CHKERRQ(ierr);
1019d8588912SDave May     }
1020d8588912SDave May   }
1021d8588912SDave May   PetscFunctionReturn(0);
1022d8588912SDave May }
1023d8588912SDave May 
1024c222c20dSDavid Ham static PetscErrorCode MatCopy_Nest(Mat A,Mat B,MatStructure str)
1025c222c20dSDavid Ham {
1026c222c20dSDavid Ham   Mat_Nest       *bA = (Mat_Nest*)A->data,*bB = (Mat_Nest*)B->data;
1027c222c20dSDavid Ham   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
1028c222c20dSDavid Ham   PetscErrorCode ierr;
102906a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
1030c222c20dSDavid Ham 
1031c222c20dSDavid Ham   PetscFunctionBegin;
1032c222c20dSDavid Ham   if (nr != bB->nr || nc != bB->nc) SETERRQ4(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Cannot copy a Mat_Nest of block size (%D,%D) to a Mat_Nest of block size (%D,%D)",bB->nr,bB->nc,nr,nc);
1033c222c20dSDavid Ham   for (i=0; i<nr; i++) {
1034c222c20dSDavid Ham     for (j=0; j<nc; j++) {
103506a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
103646a2b97cSJed Brown       if (bA->m[i][j] && bB->m[i][j]) {
1037c222c20dSDavid Ham         ierr = MatCopy(bA->m[i][j],bB->m[i][j],str);CHKERRQ(ierr);
103846a2b97cSJed Brown       } else if (bA->m[i][j] || bB->m[i][j]) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %D,%D",i,j);
103906a1af2fSStefano Zampini       ierr = MatGetNonzeroState(bB->m[i][j],&subnnzstate);CHKERRQ(ierr);
104006a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || bB->nnzstate[i*nc+j] != subnnzstate);
104106a1af2fSStefano Zampini       bB->nnzstate[i*nc+j] = subnnzstate;
1042c222c20dSDavid Ham     }
1043c222c20dSDavid Ham   }
104406a1af2fSStefano Zampini   if (nnzstate) B->nonzerostate++;
1045c222c20dSDavid Ham   PetscFunctionReturn(0);
1046c222c20dSDavid Ham }
1047c222c20dSDavid Ham 
10486e76ffeaSPierre Jolivet static PetscErrorCode MatAXPY_Nest(Mat Y,PetscScalar a,Mat X,MatStructure str)
10496e76ffeaSPierre Jolivet {
10506e76ffeaSPierre Jolivet   Mat_Nest       *bY = (Mat_Nest*)Y->data,*bX = (Mat_Nest*)X->data;
10516e76ffeaSPierre Jolivet   PetscInt       i,j,nr = bY->nr,nc = bY->nc;
10526e76ffeaSPierre Jolivet   PetscErrorCode ierr;
105306a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
10546e76ffeaSPierre Jolivet 
10556e76ffeaSPierre Jolivet   PetscFunctionBegin;
10566e76ffeaSPierre Jolivet   if (nr != bX->nr || nc != bX->nc) SETERRQ4(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Cannot AXPY a MatNest of block size (%D,%D) with a MatNest of block size (%D,%D)",bX->nr,bX->nc,nr,nc);
10576e76ffeaSPierre Jolivet   for (i=0; i<nr; i++) {
10586e76ffeaSPierre Jolivet     for (j=0; j<nc; j++) {
105906a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
10606e76ffeaSPierre Jolivet       if (bY->m[i][j] && bX->m[i][j]) {
10616e76ffeaSPierre Jolivet         ierr = MatAXPY(bY->m[i][j],a,bX->m[i][j],str);CHKERRQ(ierr);
1062c066aebcSStefano Zampini       } else if (bX->m[i][j]) {
1063c066aebcSStefano Zampini         Mat M;
1064c066aebcSStefano Zampini 
1065060bfc19SStefano Zampini         if (str != DIFFERENT_NONZERO_PATTERN) SETERRQ2(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %D,%D. Use DIFFERENT_NONZERO_PATTERN",i,j);
1066c066aebcSStefano Zampini         ierr = MatDuplicate(bX->m[i][j],MAT_COPY_VALUES,&M);CHKERRQ(ierr);
1067c066aebcSStefano Zampini         ierr = MatNestSetSubMat(Y,i,j,M);CHKERRQ(ierr);
1068c066aebcSStefano Zampini         ierr = MatDestroy(&M);CHKERRQ(ierr);
1069c066aebcSStefano Zampini       }
1070060bfc19SStefano Zampini       if (bY->m[i][j]) { ierr = MatGetNonzeroState(bY->m[i][j],&subnnzstate);CHKERRQ(ierr); }
107106a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || bY->nnzstate[i*nc+j] != subnnzstate);
107206a1af2fSStefano Zampini       bY->nnzstate[i*nc+j] = subnnzstate;
10736e76ffeaSPierre Jolivet     }
10746e76ffeaSPierre Jolivet   }
107506a1af2fSStefano Zampini   if (nnzstate) Y->nonzerostate++;
10766e76ffeaSPierre Jolivet   PetscFunctionReturn(0);
10776e76ffeaSPierre Jolivet }
10786e76ffeaSPierre Jolivet 
1079207556f9SJed Brown static PetscErrorCode MatDuplicate_Nest(Mat A,MatDuplicateOption op,Mat *B)
1080d8588912SDave May {
1081d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
1082841e96a3SJed Brown   Mat            *b;
1083841e96a3SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
1084d8588912SDave May   PetscErrorCode ierr;
1085d8588912SDave May 
1086d8588912SDave May   PetscFunctionBegin;
1087785e854fSJed Brown   ierr = PetscMalloc1(nr*nc,&b);CHKERRQ(ierr);
1088841e96a3SJed Brown   for (i=0; i<nr; i++) {
1089841e96a3SJed Brown     for (j=0; j<nc; j++) {
1090841e96a3SJed Brown       if (bA->m[i][j]) {
1091841e96a3SJed Brown         ierr = MatDuplicate(bA->m[i][j],op,&b[i*nc+j]);CHKERRQ(ierr);
1092841e96a3SJed Brown       } else {
10930298fd71SBarry Smith         b[i*nc+j] = NULL;
1094d8588912SDave May       }
1095d8588912SDave May     }
1096d8588912SDave May   }
1097ce94432eSBarry Smith   ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nr,bA->isglobal.row,nc,bA->isglobal.col,b,B);CHKERRQ(ierr);
1098841e96a3SJed Brown   /* Give the new MatNest exclusive ownership */
1099841e96a3SJed Brown   for (i=0; i<nr*nc; i++) {
11006bf464f9SBarry Smith     ierr = MatDestroy(&b[i]);CHKERRQ(ierr);
1101d8588912SDave May   }
1102d8588912SDave May   ierr = PetscFree(b);CHKERRQ(ierr);
1103d8588912SDave May 
1104841e96a3SJed Brown   ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1105841e96a3SJed Brown   ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1106d8588912SDave May   PetscFunctionReturn(0);
1107d8588912SDave May }
1108d8588912SDave May 
1109d8588912SDave May /* nest api */
1110d8588912SDave May PetscErrorCode MatNestGetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat *mat)
1111d8588912SDave May {
1112d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
11135fd66863SKarl Rupp 
1114d8588912SDave May   PetscFunctionBegin;
1115ce94432eSBarry Smith   if (idxm >= bA->nr) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",idxm,bA->nr-1);
1116ce94432eSBarry Smith   if (jdxm >= bA->nc) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %D max %D",jdxm,bA->nc-1);
1117d8588912SDave May   *mat = bA->m[idxm][jdxm];
1118d8588912SDave May   PetscFunctionReturn(0);
1119d8588912SDave May }
1120d8588912SDave May 
11219ba0d327SJed Brown /*@
1122d8588912SDave May  MatNestGetSubMat - Returns a single, sub-matrix from a nest matrix.
1123d8588912SDave May 
1124d8588912SDave May  Not collective
1125d8588912SDave May 
1126d8588912SDave May  Input Parameters:
1127629881c0SJed Brown +   A  - nest matrix
1128d8588912SDave May .   idxm - index of the matrix within the nest matrix
1129629881c0SJed Brown -   jdxm - index of the matrix within the nest matrix
1130d8588912SDave May 
1131d8588912SDave May  Output Parameter:
1132d8588912SDave May .   sub - matrix at index idxm,jdxm within the nest matrix
1133d8588912SDave May 
1134d8588912SDave May  Level: developer
1135d8588912SDave May 
1136bb97c47cSPierre Jolivet .seealso: MatNestGetSize(), MatNestGetSubMats(), MatCreateNest(), MATNEST, MatNestSetSubMat(),
113779798668SBarry Smith           MatNestGetLocalISs(), MatNestGetISs()
1138d8588912SDave May @*/
11397087cfbeSBarry Smith PetscErrorCode  MatNestGetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat *sub)
1140d8588912SDave May {
1141699a902aSJed Brown   PetscErrorCode ierr;
1142d8588912SDave May 
1143d8588912SDave May   PetscFunctionBegin;
1144699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSubMat_C",(Mat,PetscInt,PetscInt,Mat*),(A,idxm,jdxm,sub));CHKERRQ(ierr);
1145d8588912SDave May   PetscFunctionReturn(0);
1146d8588912SDave May }
1147d8588912SDave May 
11480782ca92SJed Brown PetscErrorCode MatNestSetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat mat)
11490782ca92SJed Brown {
11500782ca92SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
11510782ca92SJed Brown   PetscInt       m,n,M,N,mi,ni,Mi,Ni;
11520782ca92SJed Brown   PetscErrorCode ierr;
11530782ca92SJed Brown 
11540782ca92SJed Brown   PetscFunctionBegin;
1155ce94432eSBarry Smith   if (idxm >= bA->nr) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",idxm,bA->nr-1);
1156ce94432eSBarry Smith   if (jdxm >= bA->nc) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %D max %D",jdxm,bA->nc-1);
11570782ca92SJed Brown   ierr = MatGetLocalSize(mat,&m,&n);CHKERRQ(ierr);
11580782ca92SJed Brown   ierr = MatGetSize(mat,&M,&N);CHKERRQ(ierr);
11590782ca92SJed Brown   ierr = ISGetLocalSize(bA->isglobal.row[idxm],&mi);CHKERRQ(ierr);
11600782ca92SJed Brown   ierr = ISGetSize(bA->isglobal.row[idxm],&Mi);CHKERRQ(ierr);
11610782ca92SJed Brown   ierr = ISGetLocalSize(bA->isglobal.col[jdxm],&ni);CHKERRQ(ierr);
11620782ca92SJed Brown   ierr = ISGetSize(bA->isglobal.col[jdxm],&Ni);CHKERRQ(ierr);
1163ce94432eSBarry Smith   if (M != Mi || N != Ni) SETERRQ4(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix dimension (%D,%D) incompatible with nest block (%D,%D)",M,N,Mi,Ni);
1164ce94432eSBarry Smith   if (m != mi || n != ni) SETERRQ4(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix local dimension (%D,%D) incompatible with nest block (%D,%D)",m,n,mi,ni);
116526fbe8dcSKarl Rupp 
116606a1af2fSStefano Zampini   /* do not increase object state */
116706a1af2fSStefano Zampini   if (mat == bA->m[idxm][jdxm]) PetscFunctionReturn(0);
116806a1af2fSStefano Zampini 
11690782ca92SJed Brown   ierr = PetscObjectReference((PetscObject)mat);CHKERRQ(ierr);
11700782ca92SJed Brown   ierr = MatDestroy(&bA->m[idxm][jdxm]);CHKERRQ(ierr);
11710782ca92SJed Brown   bA->m[idxm][jdxm] = mat;
117206a1af2fSStefano Zampini   ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr);
117306a1af2fSStefano Zampini   ierr = MatGetNonzeroState(mat,&bA->nnzstate[idxm*bA->nc+jdxm]);CHKERRQ(ierr);
117406a1af2fSStefano Zampini   A->nonzerostate++;
11750782ca92SJed Brown   PetscFunctionReturn(0);
11760782ca92SJed Brown }
11770782ca92SJed Brown 
11789ba0d327SJed Brown /*@
11790782ca92SJed Brown  MatNestSetSubMat - Set a single submatrix in the nest matrix.
11800782ca92SJed Brown 
11810782ca92SJed Brown  Logically collective on the submatrix communicator
11820782ca92SJed Brown 
11830782ca92SJed Brown  Input Parameters:
11840782ca92SJed Brown +   A  - nest matrix
11850782ca92SJed Brown .   idxm - index of the matrix within the nest matrix
11860782ca92SJed Brown .   jdxm - index of the matrix within the nest matrix
11870782ca92SJed Brown -   sub - matrix at index idxm,jdxm within the nest matrix
11880782ca92SJed Brown 
11890782ca92SJed Brown  Notes:
11900782ca92SJed Brown  The new submatrix must have the same size and communicator as that block of the nest.
11910782ca92SJed Brown 
11920782ca92SJed Brown  This increments the reference count of the submatrix.
11930782ca92SJed Brown 
11940782ca92SJed Brown  Level: developer
11950782ca92SJed Brown 
1196bb97c47cSPierre Jolivet .seealso: MatNestSetSubMats(), MatNestGetSubMats(), MatNestGetLocalISs(), MATNEST, MatCreateNest(),
119779798668SBarry Smith           MatNestGetSubMat(), MatNestGetISs(), MatNestGetSize()
11980782ca92SJed Brown @*/
11990782ca92SJed Brown PetscErrorCode  MatNestSetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat sub)
12000782ca92SJed Brown {
12010782ca92SJed Brown   PetscErrorCode ierr;
12020782ca92SJed Brown 
12030782ca92SJed Brown   PetscFunctionBegin;
12040782ca92SJed Brown   ierr = PetscUseMethod(A,"MatNestSetSubMat_C",(Mat,PetscInt,PetscInt,Mat),(A,idxm,jdxm,sub));CHKERRQ(ierr);
12050782ca92SJed Brown   PetscFunctionReturn(0);
12060782ca92SJed Brown }
12070782ca92SJed Brown 
1208d8588912SDave May PetscErrorCode MatNestGetSubMats_Nest(Mat A,PetscInt *M,PetscInt *N,Mat ***mat)
1209d8588912SDave May {
1210d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
12115fd66863SKarl Rupp 
1212d8588912SDave May   PetscFunctionBegin;
121326fbe8dcSKarl Rupp   if (M)   *M   = bA->nr;
121426fbe8dcSKarl Rupp   if (N)   *N   = bA->nc;
121526fbe8dcSKarl Rupp   if (mat) *mat = bA->m;
1216d8588912SDave May   PetscFunctionReturn(0);
1217d8588912SDave May }
1218d8588912SDave May 
1219d8588912SDave May /*@C
1220d8588912SDave May  MatNestGetSubMats - Returns the entire two dimensional array of matrices defining a nest matrix.
1221d8588912SDave May 
1222d8588912SDave May  Not collective
1223d8588912SDave May 
1224d8588912SDave May  Input Parameters:
1225629881c0SJed Brown .   A  - nest matrix
1226d8588912SDave May 
1227d8588912SDave May  Output Parameter:
1228629881c0SJed Brown +   M - number of rows in the nest matrix
1229d8588912SDave May .   N - number of cols in the nest matrix
1230629881c0SJed Brown -   mat - 2d array of matrices
1231d8588912SDave May 
1232d8588912SDave May  Notes:
1233d8588912SDave May 
1234d8588912SDave May  The user should not free the array mat.
1235d8588912SDave May 
1236351962e3SVincent Le Chenadec  In Fortran, this routine has a calling sequence
1237351962e3SVincent Le Chenadec $   call MatNestGetSubMats(A, M, N, mat, ierr)
1238351962e3SVincent Le Chenadec  where the space allocated for the optional argument mat is assumed large enough (if provided).
1239351962e3SVincent Le Chenadec 
1240d8588912SDave May  Level: developer
1241d8588912SDave May 
1242bb97c47cSPierre Jolivet .seealso: MatNestGetSize(), MatNestGetSubMat(), MatNestGetLocalISs(), MATNEST, MatCreateNest(),
124379798668SBarry Smith           MatNestSetSubMats(), MatNestGetISs(), MatNestSetSubMat()
1244d8588912SDave May @*/
12457087cfbeSBarry Smith PetscErrorCode  MatNestGetSubMats(Mat A,PetscInt *M,PetscInt *N,Mat ***mat)
1246d8588912SDave May {
1247699a902aSJed Brown   PetscErrorCode ierr;
1248d8588912SDave May 
1249d8588912SDave May   PetscFunctionBegin;
1250699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSubMats_C",(Mat,PetscInt*,PetscInt*,Mat***),(A,M,N,mat));CHKERRQ(ierr);
1251d8588912SDave May   PetscFunctionReturn(0);
1252d8588912SDave May }
1253d8588912SDave May 
12547087cfbeSBarry Smith PetscErrorCode  MatNestGetSize_Nest(Mat A,PetscInt *M,PetscInt *N)
1255d8588912SDave May {
1256d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
1257d8588912SDave May 
1258d8588912SDave May   PetscFunctionBegin;
125926fbe8dcSKarl Rupp   if (M) *M = bA->nr;
126026fbe8dcSKarl Rupp   if (N) *N = bA->nc;
1261d8588912SDave May   PetscFunctionReturn(0);
1262d8588912SDave May }
1263d8588912SDave May 
12649ba0d327SJed Brown /*@
1265d8588912SDave May  MatNestGetSize - Returns the size of the nest matrix.
1266d8588912SDave May 
1267d8588912SDave May  Not collective
1268d8588912SDave May 
1269d8588912SDave May  Input Parameters:
1270d8588912SDave May .   A  - nest matrix
1271d8588912SDave May 
1272d8588912SDave May  Output Parameter:
1273629881c0SJed Brown +   M - number of rows in the nested mat
1274629881c0SJed Brown -   N - number of cols in the nested mat
1275d8588912SDave May 
1276d8588912SDave May  Notes:
1277d8588912SDave May 
1278d8588912SDave May  Level: developer
1279d8588912SDave May 
1280bb97c47cSPierre Jolivet .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MATNEST, MatCreateNest(), MatNestGetLocalISs(),
128179798668SBarry Smith           MatNestGetISs()
1282d8588912SDave May @*/
12837087cfbeSBarry Smith PetscErrorCode  MatNestGetSize(Mat A,PetscInt *M,PetscInt *N)
1284d8588912SDave May {
1285699a902aSJed Brown   PetscErrorCode ierr;
1286d8588912SDave May 
1287d8588912SDave May   PetscFunctionBegin;
1288699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSize_C",(Mat,PetscInt*,PetscInt*),(A,M,N));CHKERRQ(ierr);
1289d8588912SDave May   PetscFunctionReturn(0);
1290d8588912SDave May }
1291d8588912SDave May 
1292f7a08781SBarry Smith static PetscErrorCode MatNestGetISs_Nest(Mat A,IS rows[],IS cols[])
1293900e7ff2SJed Brown {
1294900e7ff2SJed Brown   Mat_Nest *vs = (Mat_Nest*)A->data;
1295900e7ff2SJed Brown   PetscInt i;
1296900e7ff2SJed Brown 
1297900e7ff2SJed Brown   PetscFunctionBegin;
1298900e7ff2SJed Brown   if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->isglobal.row[i];
1299900e7ff2SJed Brown   if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->isglobal.col[i];
1300900e7ff2SJed Brown   PetscFunctionReturn(0);
1301900e7ff2SJed Brown }
1302900e7ff2SJed Brown 
13033a4d7b9aSSatish Balay /*@C
1304900e7ff2SJed Brown  MatNestGetISs - Returns the index sets partitioning the row and column spaces
1305900e7ff2SJed Brown 
1306900e7ff2SJed Brown  Not collective
1307900e7ff2SJed Brown 
1308900e7ff2SJed Brown  Input Parameters:
1309900e7ff2SJed Brown .   A  - nest matrix
1310900e7ff2SJed Brown 
1311900e7ff2SJed Brown  Output Parameter:
1312900e7ff2SJed Brown +   rows - array of row index sets
1313900e7ff2SJed Brown -   cols - array of column index sets
1314900e7ff2SJed Brown 
1315900e7ff2SJed Brown  Level: advanced
1316900e7ff2SJed Brown 
1317900e7ff2SJed Brown  Notes:
1318900e7ff2SJed Brown  The user must have allocated arrays of the correct size. The reference count is not increased on the returned ISs.
1319900e7ff2SJed Brown 
132079798668SBarry Smith .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetLocalISs(), MATNEST,
1321bb97c47cSPierre Jolivet           MatCreateNest(), MatNestGetSubMats(), MatNestSetSubMats()
1322900e7ff2SJed Brown @*/
1323900e7ff2SJed Brown PetscErrorCode  MatNestGetISs(Mat A,IS rows[],IS cols[])
1324900e7ff2SJed Brown {
1325900e7ff2SJed Brown   PetscErrorCode ierr;
1326900e7ff2SJed Brown 
1327900e7ff2SJed Brown   PetscFunctionBegin;
1328900e7ff2SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1329900e7ff2SJed Brown   ierr = PetscUseMethod(A,"MatNestGetISs_C",(Mat,IS[],IS[]),(A,rows,cols));CHKERRQ(ierr);
1330900e7ff2SJed Brown   PetscFunctionReturn(0);
1331900e7ff2SJed Brown }
1332900e7ff2SJed Brown 
1333f7a08781SBarry Smith static PetscErrorCode MatNestGetLocalISs_Nest(Mat A,IS rows[],IS cols[])
1334900e7ff2SJed Brown {
1335900e7ff2SJed Brown   Mat_Nest *vs = (Mat_Nest*)A->data;
1336900e7ff2SJed Brown   PetscInt i;
1337900e7ff2SJed Brown 
1338900e7ff2SJed Brown   PetscFunctionBegin;
1339900e7ff2SJed Brown   if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->islocal.row[i];
1340900e7ff2SJed Brown   if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->islocal.col[i];
1341900e7ff2SJed Brown   PetscFunctionReturn(0);
1342900e7ff2SJed Brown }
1343900e7ff2SJed Brown 
1344900e7ff2SJed Brown /*@C
1345900e7ff2SJed Brown  MatNestGetLocalISs - Returns the index sets partitioning the row and column spaces
1346900e7ff2SJed Brown 
1347900e7ff2SJed Brown  Not collective
1348900e7ff2SJed Brown 
1349900e7ff2SJed Brown  Input Parameters:
1350900e7ff2SJed Brown .   A  - nest matrix
1351900e7ff2SJed Brown 
1352900e7ff2SJed Brown  Output Parameter:
13530298fd71SBarry Smith +   rows - array of row index sets (or NULL to ignore)
13540298fd71SBarry Smith -   cols - array of column index sets (or NULL to ignore)
1355900e7ff2SJed Brown 
1356900e7ff2SJed Brown  Level: advanced
1357900e7ff2SJed Brown 
1358900e7ff2SJed Brown  Notes:
1359900e7ff2SJed Brown  The user must have allocated arrays of the correct size. The reference count is not increased on the returned ISs.
1360900e7ff2SJed Brown 
1361bb97c47cSPierre Jolivet .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetISs(), MatCreateNest(),
136279798668SBarry Smith           MATNEST, MatNestSetSubMats(), MatNestSetSubMat()
1363900e7ff2SJed Brown @*/
1364900e7ff2SJed Brown PetscErrorCode  MatNestGetLocalISs(Mat A,IS rows[],IS cols[])
1365900e7ff2SJed Brown {
1366900e7ff2SJed Brown   PetscErrorCode ierr;
1367900e7ff2SJed Brown 
1368900e7ff2SJed Brown   PetscFunctionBegin;
1369900e7ff2SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1370900e7ff2SJed Brown   ierr = PetscUseMethod(A,"MatNestGetLocalISs_C",(Mat,IS[],IS[]),(A,rows,cols));CHKERRQ(ierr);
1371900e7ff2SJed Brown   PetscFunctionReturn(0);
1372900e7ff2SJed Brown }
1373900e7ff2SJed Brown 
137419fd82e9SBarry Smith PetscErrorCode  MatNestSetVecType_Nest(Mat A,VecType vtype)
1375207556f9SJed Brown {
1376207556f9SJed Brown   PetscErrorCode ierr;
1377207556f9SJed Brown   PetscBool      flg;
1378207556f9SJed Brown 
1379207556f9SJed Brown   PetscFunctionBegin;
1380207556f9SJed Brown   ierr = PetscStrcmp(vtype,VECNEST,&flg);CHKERRQ(ierr);
1381207556f9SJed Brown   /* In reality, this only distinguishes VECNEST and "other" */
13822a7a6963SBarry Smith   if (flg) A->ops->getvecs = MatCreateVecs_Nest;
138312b53f24SSatish Balay   else A->ops->getvecs = (PetscErrorCode (*)(Mat,Vec*,Vec*)) 0;
1384207556f9SJed Brown   PetscFunctionReturn(0);
1385207556f9SJed Brown }
1386207556f9SJed Brown 
1387207556f9SJed Brown /*@C
13882a7a6963SBarry Smith  MatNestSetVecType - Sets the type of Vec returned by MatCreateVecs()
1389207556f9SJed Brown 
1390207556f9SJed Brown  Not collective
1391207556f9SJed Brown 
1392207556f9SJed Brown  Input Parameters:
1393207556f9SJed Brown +  A  - nest matrix
1394207556f9SJed Brown -  vtype - type to use for creating vectors
1395207556f9SJed Brown 
1396207556f9SJed Brown  Notes:
1397207556f9SJed Brown 
1398207556f9SJed Brown  Level: developer
1399207556f9SJed Brown 
1400bb97c47cSPierre Jolivet .seealso: MatCreateVecs(), MATNEST, MatCreateNest()
1401207556f9SJed Brown @*/
140219fd82e9SBarry Smith PetscErrorCode  MatNestSetVecType(Mat A,VecType vtype)
1403207556f9SJed Brown {
1404207556f9SJed Brown   PetscErrorCode ierr;
1405207556f9SJed Brown 
1406207556f9SJed Brown   PetscFunctionBegin;
140719fd82e9SBarry Smith   ierr = PetscTryMethod(A,"MatNestSetVecType_C",(Mat,VecType),(A,vtype));CHKERRQ(ierr);
1408207556f9SJed Brown   PetscFunctionReturn(0);
1409207556f9SJed Brown }
1410207556f9SJed Brown 
1411c8883902SJed Brown PetscErrorCode MatNestSetSubMats_Nest(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[])
1412d8588912SDave May {
1413c8883902SJed Brown   Mat_Nest       *s = (Mat_Nest*)A->data;
1414c8883902SJed Brown   PetscInt       i,j,m,n,M,N;
1415d8588912SDave May   PetscErrorCode ierr;
141606a1af2fSStefano Zampini   PetscBool      cong;
1417d8588912SDave May 
1418d8588912SDave May   PetscFunctionBegin;
141906a1af2fSStefano Zampini   ierr = MatReset_Nest(A);CHKERRQ(ierr);
142006a1af2fSStefano Zampini 
1421c8883902SJed Brown   s->nr = nr;
1422c8883902SJed Brown   s->nc = nc;
1423d8588912SDave May 
1424c8883902SJed Brown   /* Create space for submatrices */
1425854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&s->m);CHKERRQ(ierr);
1426c8883902SJed Brown   for (i=0; i<nr; i++) {
1427854ce69bSBarry Smith     ierr = PetscMalloc1(nc,&s->m[i]);CHKERRQ(ierr);
1428d8588912SDave May   }
1429c8883902SJed Brown   for (i=0; i<nr; i++) {
1430c8883902SJed Brown     for (j=0; j<nc; j++) {
1431c8883902SJed Brown       s->m[i][j] = a[i*nc+j];
1432c8883902SJed Brown       if (a[i*nc+j]) {
1433c8883902SJed Brown         ierr = PetscObjectReference((PetscObject)a[i*nc+j]);CHKERRQ(ierr);
1434d8588912SDave May       }
1435d8588912SDave May     }
1436d8588912SDave May   }
1437d8588912SDave May 
14388188e55aSJed Brown   ierr = MatSetUp_NestIS_Private(A,nr,is_row,nc,is_col);CHKERRQ(ierr);
1439d8588912SDave May 
1440854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&s->row_len);CHKERRQ(ierr);
1441854ce69bSBarry Smith   ierr = PetscMalloc1(nc,&s->col_len);CHKERRQ(ierr);
1442c8883902SJed Brown   for (i=0; i<nr; i++) s->row_len[i]=-1;
1443c8883902SJed Brown   for (j=0; j<nc; j++) s->col_len[j]=-1;
1444d8588912SDave May 
144506a1af2fSStefano Zampini   ierr = PetscCalloc1(nr*nc,&s->nnzstate);CHKERRQ(ierr);
144606a1af2fSStefano Zampini   for (i=0; i<nr; i++) {
144706a1af2fSStefano Zampini     for (j=0; j<nc; j++) {
144806a1af2fSStefano Zampini       if (s->m[i][j]) {
144906a1af2fSStefano Zampini         ierr = MatGetNonzeroState(s->m[i][j],&s->nnzstate[i*nc+j]);CHKERRQ(ierr);
145006a1af2fSStefano Zampini       }
145106a1af2fSStefano Zampini     }
145206a1af2fSStefano Zampini   }
145306a1af2fSStefano Zampini 
14548188e55aSJed Brown   ierr = MatNestGetSizes_Private(A,&m,&n,&M,&N);CHKERRQ(ierr);
1455d8588912SDave May 
1456c8883902SJed Brown   ierr = PetscLayoutSetSize(A->rmap,M);CHKERRQ(ierr);
1457c8883902SJed Brown   ierr = PetscLayoutSetLocalSize(A->rmap,m);CHKERRQ(ierr);
1458c8883902SJed Brown   ierr = PetscLayoutSetSize(A->cmap,N);CHKERRQ(ierr);
1459c8883902SJed Brown   ierr = PetscLayoutSetLocalSize(A->cmap,n);CHKERRQ(ierr);
1460c8883902SJed Brown 
1461c8883902SJed Brown   ierr = PetscLayoutSetUp(A->rmap);CHKERRQ(ierr);
1462c8883902SJed Brown   ierr = PetscLayoutSetUp(A->cmap);CHKERRQ(ierr);
1463c8883902SJed Brown 
146406a1af2fSStefano Zampini   /* disable operations that are not supported for non-square matrices,
146506a1af2fSStefano Zampini      or matrices for which is_row != is_col  */
146606a1af2fSStefano Zampini   ierr = MatHasCongruentLayouts(A,&cong);CHKERRQ(ierr);
146706a1af2fSStefano Zampini   if (cong && nr != nc) cong = PETSC_FALSE;
146806a1af2fSStefano Zampini   if (cong) {
146906a1af2fSStefano Zampini     for (i = 0; cong && i < nr; i++) {
1470320466b0SStefano Zampini       ierr = ISEqualUnsorted(s->isglobal.row[i],s->isglobal.col[i],&cong);CHKERRQ(ierr);
147106a1af2fSStefano Zampini     }
147206a1af2fSStefano Zampini   }
147306a1af2fSStefano Zampini   if (!cong) {
1474381b8e50SStefano Zampini     A->ops->missingdiagonal = NULL;
147506a1af2fSStefano Zampini     A->ops->getdiagonal     = NULL;
147606a1af2fSStefano Zampini     A->ops->shift           = NULL;
147706a1af2fSStefano Zampini     A->ops->diagonalset     = NULL;
147806a1af2fSStefano Zampini   }
147906a1af2fSStefano Zampini 
14801795a4d1SJed Brown   ierr = PetscCalloc2(nr,&s->left,nc,&s->right);CHKERRQ(ierr);
148106a1af2fSStefano Zampini   ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr);
148206a1af2fSStefano Zampini   A->nonzerostate++;
1483d8588912SDave May   PetscFunctionReturn(0);
1484d8588912SDave May }
1485d8588912SDave May 
1486c8883902SJed Brown /*@
1487c8883902SJed Brown    MatNestSetSubMats - Sets the nested submatrices
1488c8883902SJed Brown 
1489c8883902SJed Brown    Collective on Mat
1490c8883902SJed Brown 
1491c8883902SJed Brown    Input Parameter:
1492ffd6319bSRichard Tran Mills +  A - nested matrix
1493c8883902SJed Brown .  nr - number of nested row blocks
14940298fd71SBarry Smith .  is_row - index sets for each nested row block, or NULL to make contiguous
1495c8883902SJed Brown .  nc - number of nested column blocks
14960298fd71SBarry Smith .  is_col - index sets for each nested column block, or NULL to make contiguous
14970298fd71SBarry Smith -  a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL
1498c8883902SJed Brown 
149906a1af2fSStefano Zampini    Notes: this always resets any submatrix information previously set
150006a1af2fSStefano Zampini 
1501c8883902SJed Brown    Level: advanced
1502c8883902SJed Brown 
150379798668SBarry Smith .seealso: MatCreateNest(), MATNEST, MatNestSetSubMat(), MatNestGetSubMat(), MatNestGetSubMats()
1504c8883902SJed Brown @*/
1505c8883902SJed Brown PetscErrorCode MatNestSetSubMats(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[])
1506c8883902SJed Brown {
1507c8883902SJed Brown   PetscErrorCode ierr;
150806a1af2fSStefano Zampini   PetscInt       i;
1509c8883902SJed Brown 
1510c8883902SJed Brown   PetscFunctionBegin;
1511c8883902SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1512ce94432eSBarry Smith   if (nr < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of rows cannot be negative");
1513c8883902SJed Brown   if (nr && is_row) {
1514c8883902SJed Brown     PetscValidPointer(is_row,3);
1515c8883902SJed Brown     for (i=0; i<nr; i++) PetscValidHeaderSpecific(is_row[i],IS_CLASSID,3);
1516c8883902SJed Brown   }
1517ce94432eSBarry Smith   if (nc < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of columns cannot be negative");
15181664e352SJed Brown   if (nc && is_col) {
1519c8883902SJed Brown     PetscValidPointer(is_col,5);
15209b30a8f6SBarry Smith     for (i=0; i<nc; i++) PetscValidHeaderSpecific(is_col[i],IS_CLASSID,5);
1521c8883902SJed Brown   }
152206a1af2fSStefano Zampini   if (nr*nc > 0) PetscValidPointer(a,6);
1523c8883902SJed Brown   ierr = PetscUseMethod(A,"MatNestSetSubMats_C",(Mat,PetscInt,const IS[],PetscInt,const IS[],const Mat[]),(A,nr,is_row,nc,is_col,a));CHKERRQ(ierr);
1524c8883902SJed Brown   PetscFunctionReturn(0);
1525c8883902SJed Brown }
1526d8588912SDave May 
152745b6f7e9SBarry Smith static PetscErrorCode MatNestCreateAggregateL2G_Private(Mat A,PetscInt n,const IS islocal[],const IS isglobal[],PetscBool colflg,ISLocalToGlobalMapping *ltog)
152877019fcaSJed Brown {
152977019fcaSJed Brown   PetscErrorCode ierr;
153077019fcaSJed Brown   PetscBool      flg;
153177019fcaSJed Brown   PetscInt       i,j,m,mi,*ix;
153277019fcaSJed Brown 
153377019fcaSJed Brown   PetscFunctionBegin;
1534aea6d515SStefano Zampini   *ltog = NULL;
153577019fcaSJed Brown   for (i=0,m=0,flg=PETSC_FALSE; i<n; i++) {
153677019fcaSJed Brown     if (islocal[i]) {
1537aea6d515SStefano Zampini       ierr = ISGetLocalSize(islocal[i],&mi);CHKERRQ(ierr);
153877019fcaSJed Brown       flg  = PETSC_TRUE;      /* We found a non-trivial entry */
153977019fcaSJed Brown     } else {
1540aea6d515SStefano Zampini       ierr = ISGetLocalSize(isglobal[i],&mi);CHKERRQ(ierr);
154177019fcaSJed Brown     }
154277019fcaSJed Brown     m += mi;
154377019fcaSJed Brown   }
1544aea6d515SStefano Zampini   if (!flg) PetscFunctionReturn(0);
1545aea6d515SStefano Zampini 
1546785e854fSJed Brown   ierr = PetscMalloc1(m,&ix);CHKERRQ(ierr);
1547165cd838SBarry Smith   for (i=0,m=0; i<n; i++) {
15480298fd71SBarry Smith     ISLocalToGlobalMapping smap = NULL;
1549e108cb99SStefano Zampini     Mat                    sub = NULL;
1550f6d38dbbSStefano Zampini     PetscSF                sf;
1551f6d38dbbSStefano Zampini     PetscLayout            map;
1552aea6d515SStefano Zampini     const PetscInt         *ix2;
155377019fcaSJed Brown 
1554165cd838SBarry Smith     if (!colflg) {
155577019fcaSJed Brown       ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
155677019fcaSJed Brown     } else {
155777019fcaSJed Brown       ierr = MatNestFindNonzeroSubMatCol(A,i,&sub);CHKERRQ(ierr);
155877019fcaSJed Brown     }
1559191fd14bSBarry Smith     if (sub) {
1560191fd14bSBarry Smith       if (!colflg) {
1561191fd14bSBarry Smith         ierr = MatGetLocalToGlobalMapping(sub,&smap,NULL);CHKERRQ(ierr);
1562191fd14bSBarry Smith       } else {
1563191fd14bSBarry Smith         ierr = MatGetLocalToGlobalMapping(sub,NULL,&smap);CHKERRQ(ierr);
1564191fd14bSBarry Smith       }
1565191fd14bSBarry Smith     }
156677019fcaSJed Brown     /*
156777019fcaSJed Brown        Now we need to extract the monolithic global indices that correspond to the given split global indices.
156877019fcaSJed Brown        In many/most cases, we only want MatGetLocalSubMatrix() to work, in which case we only need to know the size of the local spaces.
156977019fcaSJed Brown     */
1570aea6d515SStefano Zampini     ierr = ISGetIndices(isglobal[i],&ix2);CHKERRQ(ierr);
1571aea6d515SStefano Zampini     if (islocal[i]) {
1572aea6d515SStefano Zampini       PetscInt *ilocal,*iremote;
1573aea6d515SStefano Zampini       PetscInt mil,nleaves;
1574aea6d515SStefano Zampini 
1575aea6d515SStefano Zampini       ierr = ISGetLocalSize(islocal[i],&mi);CHKERRQ(ierr);
1576aea6d515SStefano Zampini       if (!smap) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"Missing local to global map");
1577aea6d515SStefano Zampini       for (j=0; j<mi; j++) ix[m+j] = j;
1578aea6d515SStefano Zampini       ierr = ISLocalToGlobalMappingApply(smap,mi,ix+m,ix+m);CHKERRQ(ierr);
1579aea6d515SStefano Zampini 
1580aea6d515SStefano Zampini       /* PetscSFSetGraphLayout does not like negative indices */
1581aea6d515SStefano Zampini       ierr = PetscMalloc2(mi,&ilocal,mi,&iremote);CHKERRQ(ierr);
1582aea6d515SStefano Zampini       for (j=0, nleaves = 0; j<mi; j++) {
1583aea6d515SStefano Zampini         if (ix[m+j] < 0) continue;
1584aea6d515SStefano Zampini         ilocal[nleaves]  = j;
1585aea6d515SStefano Zampini         iremote[nleaves] = ix[m+j];
1586aea6d515SStefano Zampini         nleaves++;
1587aea6d515SStefano Zampini       }
1588aea6d515SStefano Zampini       ierr = ISGetLocalSize(isglobal[i],&mil);CHKERRQ(ierr);
1589aea6d515SStefano Zampini       ierr = PetscSFCreate(PetscObjectComm((PetscObject)A),&sf);CHKERRQ(ierr);
1590aea6d515SStefano Zampini       ierr = PetscLayoutCreate(PetscObjectComm((PetscObject)A),&map);CHKERRQ(ierr);
1591aea6d515SStefano Zampini       ierr = PetscLayoutSetLocalSize(map,mil);CHKERRQ(ierr);
1592f6d38dbbSStefano Zampini       ierr = PetscLayoutSetUp(map);CHKERRQ(ierr);
1593aea6d515SStefano Zampini       ierr = PetscSFSetGraphLayout(sf,map,nleaves,ilocal,PETSC_USE_POINTER,iremote);CHKERRQ(ierr);
1594f6d38dbbSStefano Zampini       ierr = PetscLayoutDestroy(&map);CHKERRQ(ierr);
1595f6d38dbbSStefano Zampini       ierr = PetscSFBcastBegin(sf,MPIU_INT,ix2,ix + m);CHKERRQ(ierr);
1596f6d38dbbSStefano Zampini       ierr = PetscSFBcastEnd(sf,MPIU_INT,ix2,ix + m);CHKERRQ(ierr);
1597f6d38dbbSStefano Zampini       ierr = PetscSFDestroy(&sf);CHKERRQ(ierr);
1598aea6d515SStefano Zampini       ierr = PetscFree2(ilocal,iremote);CHKERRQ(ierr);
1599aea6d515SStefano Zampini     } else {
1600aea6d515SStefano Zampini       ierr = ISGetLocalSize(isglobal[i],&mi);CHKERRQ(ierr);
1601aea6d515SStefano Zampini       for (j=0; j<mi; j++) ix[m+j] = ix2[i];
1602aea6d515SStefano Zampini     }
1603aea6d515SStefano Zampini     ierr = ISRestoreIndices(isglobal[i],&ix2);CHKERRQ(ierr);
160477019fcaSJed Brown     m   += mi;
160577019fcaSJed Brown   }
1606f0413b6fSBarry Smith   ierr = ISLocalToGlobalMappingCreate(PetscObjectComm((PetscObject)A),1,m,ix,PETSC_OWN_POINTER,ltog);CHKERRQ(ierr);
160777019fcaSJed Brown   PetscFunctionReturn(0);
160877019fcaSJed Brown }
160977019fcaSJed Brown 
161077019fcaSJed Brown 
1611d8588912SDave May /* If an IS was provided, there is nothing Nest needs to do, otherwise Nest will build a strided IS */
/*
  nprocessors = NP
  Nest x^T = ((g_0,g_1,...,g_NP-1), (h_0,h_1,...,h_NP-1))
       proc 0:    => (g_0,h_0)
       proc 1:    => (g_1,h_1)
       ...
       proc NP-1: => (g_NP-1,h_NP-1)

            proc 0:                      proc 1:                    proc NP-1:
    is[0] = (0,1,2,...,nlocal(g_0)-1)  (0,1,...,nlocal(g_1)-1)  (0,1,...,nlocal(g_NP-1)-1)

            proc 0:
    is[1] = (nlocal(g_0),nlocal(g_0)+1,...,nlocal(g_0)+nlocal(h_0)-1)
            proc 1:
    is[1] = (nlocal(g_1),nlocal(g_1)+1,...,nlocal(g_1)+nlocal(h_1)-1)

            proc NP-1:
    is[1] = (nlocal(g_NP-1),nlocal(g_NP-1)+1,...,nlocal(g_NP-1)+nlocal(h_NP-1)-1)
*/
1631841e96a3SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[])
1632d8588912SDave May {
1633e2d7f03fSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
16348188e55aSJed Brown   PetscInt       i,j,offset,n,nsum,bs;
1635d8588912SDave May   PetscErrorCode ierr;
16360298fd71SBarry Smith   Mat            sub = NULL;
1637d8588912SDave May 
1638d8588912SDave May   PetscFunctionBegin;
1639854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&vs->isglobal.row);CHKERRQ(ierr);
1640854ce69bSBarry Smith   ierr = PetscMalloc1(nc,&vs->isglobal.col);CHKERRQ(ierr);
1641d8588912SDave May   if (is_row) { /* valid IS is passed in */
1642d8588912SDave May     /* refs on is[] are incremeneted */
1643e2d7f03fSJed Brown     for (i=0; i<vs->nr; i++) {
1644d8588912SDave May       ierr = PetscObjectReference((PetscObject)is_row[i]);CHKERRQ(ierr);
164526fbe8dcSKarl Rupp 
1646e2d7f03fSJed Brown       vs->isglobal.row[i] = is_row[i];
1647d8588912SDave May     }
16482ae74bdbSJed Brown   } else {                      /* Create the ISs by inspecting sizes of a submatrix in each row */
16498188e55aSJed Brown     nsum = 0;
16508188e55aSJed Brown     for (i=0; i<vs->nr; i++) {  /* Add up the local sizes to compute the aggregate offset */
16518188e55aSJed Brown       ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
1652ce94432eSBarry Smith       if (!sub) SETERRQ1(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in row %D",i);
16530298fd71SBarry Smith       ierr = MatGetLocalSize(sub,&n,NULL);CHKERRQ(ierr);
1654ce94432eSBarry Smith       if (n < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix");
16558188e55aSJed Brown       nsum += n;
16568188e55aSJed Brown     }
165755b25c41SPierre Jolivet     ierr    = MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A));CHKERRMPI(ierr);
165830bc264bSJed Brown     offset -= nsum;
1659e2d7f03fSJed Brown     for (i=0; i<vs->nr; i++) {
1660f349c1fdSJed Brown       ierr    = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
16610298fd71SBarry Smith       ierr    = MatGetLocalSize(sub,&n,NULL);CHKERRQ(ierr);
166273b6653fSLawrence Mitchell       ierr    = MatGetBlockSizes(sub,&bs,NULL);CHKERRQ(ierr);
1663ce94432eSBarry Smith       ierr    = ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.row[i]);CHKERRQ(ierr);
1664e2d7f03fSJed Brown       ierr    = ISSetBlockSize(vs->isglobal.row[i],bs);CHKERRQ(ierr);
16652ae74bdbSJed Brown       offset += n;
1666d8588912SDave May     }
1667d8588912SDave May   }
1668d8588912SDave May 
1669d8588912SDave May   if (is_col) { /* valid IS is passed in */
1670d8588912SDave May     /* refs on is[] are incremeneted */
1671e2d7f03fSJed Brown     for (j=0; j<vs->nc; j++) {
1672d8588912SDave May       ierr = PetscObjectReference((PetscObject)is_col[j]);CHKERRQ(ierr);
167326fbe8dcSKarl Rupp 
1674e2d7f03fSJed Brown       vs->isglobal.col[j] = is_col[j];
1675d8588912SDave May     }
16762ae74bdbSJed Brown   } else {                      /* Create the ISs by inspecting sizes of a submatrix in each column */
16772ae74bdbSJed Brown     offset = A->cmap->rstart;
16788188e55aSJed Brown     nsum   = 0;
16798188e55aSJed Brown     for (j=0; j<vs->nc; j++) {
16808188e55aSJed Brown       ierr = MatNestFindNonzeroSubMatCol(A,j,&sub);CHKERRQ(ierr);
1681ce94432eSBarry Smith       if (!sub) SETERRQ1(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in column %D",i);
16820298fd71SBarry Smith       ierr = MatGetLocalSize(sub,NULL,&n);CHKERRQ(ierr);
1683ce94432eSBarry Smith       if (n < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix");
16848188e55aSJed Brown       nsum += n;
16858188e55aSJed Brown     }
168655b25c41SPierre Jolivet     ierr    = MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A));CHKERRMPI(ierr);
168730bc264bSJed Brown     offset -= nsum;
1688e2d7f03fSJed Brown     for (j=0; j<vs->nc; j++) {
1689f349c1fdSJed Brown       ierr    = MatNestFindNonzeroSubMatCol(A,j,&sub);CHKERRQ(ierr);
16900298fd71SBarry Smith       ierr    = MatGetLocalSize(sub,NULL,&n);CHKERRQ(ierr);
169173b6653fSLawrence Mitchell       ierr    = MatGetBlockSizes(sub,NULL,&bs);CHKERRQ(ierr);
1692ce94432eSBarry Smith       ierr    = ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.col[j]);CHKERRQ(ierr);
1693e2d7f03fSJed Brown       ierr    = ISSetBlockSize(vs->isglobal.col[j],bs);CHKERRQ(ierr);
16942ae74bdbSJed Brown       offset += n;
1695d8588912SDave May     }
1696d8588912SDave May   }
1697e2d7f03fSJed Brown 
1698e2d7f03fSJed Brown   /* Set up the local ISs */
1699785e854fSJed Brown   ierr = PetscMalloc1(vs->nr,&vs->islocal.row);CHKERRQ(ierr);
1700785e854fSJed Brown   ierr = PetscMalloc1(vs->nc,&vs->islocal.col);CHKERRQ(ierr);
1701e2d7f03fSJed Brown   for (i=0,offset=0; i<vs->nr; i++) {
1702e2d7f03fSJed Brown     IS                     isloc;
17030298fd71SBarry Smith     ISLocalToGlobalMapping rmap = NULL;
1704e2d7f03fSJed Brown     PetscInt               nlocal,bs;
1705e2d7f03fSJed Brown     ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
17060298fd71SBarry Smith     if (sub) {ierr = MatGetLocalToGlobalMapping(sub,&rmap,NULL);CHKERRQ(ierr);}
1707207556f9SJed Brown     if (rmap) {
170873b6653fSLawrence Mitchell       ierr = MatGetBlockSizes(sub,&bs,NULL);CHKERRQ(ierr);
1709e2d7f03fSJed Brown       ierr = ISLocalToGlobalMappingGetSize(rmap,&nlocal);CHKERRQ(ierr);
1710e2d7f03fSJed Brown       ierr = ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc);CHKERRQ(ierr);
1711e2d7f03fSJed Brown       ierr = ISSetBlockSize(isloc,bs);CHKERRQ(ierr);
1712207556f9SJed Brown     } else {
1713207556f9SJed Brown       nlocal = 0;
17140298fd71SBarry Smith       isloc  = NULL;
1715207556f9SJed Brown     }
1716e2d7f03fSJed Brown     vs->islocal.row[i] = isloc;
1717e2d7f03fSJed Brown     offset            += nlocal;
1718e2d7f03fSJed Brown   }
17198188e55aSJed Brown   for (i=0,offset=0; i<vs->nc; i++) {
1720e2d7f03fSJed Brown     IS                     isloc;
17210298fd71SBarry Smith     ISLocalToGlobalMapping cmap = NULL;
1722e2d7f03fSJed Brown     PetscInt               nlocal,bs;
1723e2d7f03fSJed Brown     ierr = MatNestFindNonzeroSubMatCol(A,i,&sub);CHKERRQ(ierr);
17240298fd71SBarry Smith     if (sub) {ierr = MatGetLocalToGlobalMapping(sub,NULL,&cmap);CHKERRQ(ierr);}
1725207556f9SJed Brown     if (cmap) {
172673b6653fSLawrence Mitchell       ierr = MatGetBlockSizes(sub,NULL,&bs);CHKERRQ(ierr);
1727e2d7f03fSJed Brown       ierr = ISLocalToGlobalMappingGetSize(cmap,&nlocal);CHKERRQ(ierr);
1728e2d7f03fSJed Brown       ierr = ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc);CHKERRQ(ierr);
1729e2d7f03fSJed Brown       ierr = ISSetBlockSize(isloc,bs);CHKERRQ(ierr);
1730207556f9SJed Brown     } else {
1731207556f9SJed Brown       nlocal = 0;
17320298fd71SBarry Smith       isloc  = NULL;
1733207556f9SJed Brown     }
1734e2d7f03fSJed Brown     vs->islocal.col[i] = isloc;
1735e2d7f03fSJed Brown     offset            += nlocal;
1736e2d7f03fSJed Brown   }
17370189643fSJed Brown 
173877019fcaSJed Brown   /* Set up the aggregate ISLocalToGlobalMapping */
173977019fcaSJed Brown   {
174045b6f7e9SBarry Smith     ISLocalToGlobalMapping rmap,cmap;
174145b6f7e9SBarry Smith     ierr = MatNestCreateAggregateL2G_Private(A,vs->nr,vs->islocal.row,vs->isglobal.row,PETSC_FALSE,&rmap);CHKERRQ(ierr);
174245b6f7e9SBarry Smith     ierr = MatNestCreateAggregateL2G_Private(A,vs->nc,vs->islocal.col,vs->isglobal.col,PETSC_TRUE,&cmap);CHKERRQ(ierr);
174377019fcaSJed Brown     if (rmap && cmap) {ierr = MatSetLocalToGlobalMapping(A,rmap,cmap);CHKERRQ(ierr);}
174477019fcaSJed Brown     ierr = ISLocalToGlobalMappingDestroy(&rmap);CHKERRQ(ierr);
174577019fcaSJed Brown     ierr = ISLocalToGlobalMappingDestroy(&cmap);CHKERRQ(ierr);
174677019fcaSJed Brown   }
174777019fcaSJed Brown 
174876bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
17490189643fSJed Brown     for (i=0; i<vs->nr; i++) {
17500189643fSJed Brown       for (j=0; j<vs->nc; j++) {
17510189643fSJed Brown         PetscInt m,n,M,N,mi,ni,Mi,Ni;
17520189643fSJed Brown         Mat      B = vs->m[i][j];
17530189643fSJed Brown         if (!B) continue;
17540189643fSJed Brown         ierr = MatGetSize(B,&M,&N);CHKERRQ(ierr);
17550189643fSJed Brown         ierr = MatGetLocalSize(B,&m,&n);CHKERRQ(ierr);
17560189643fSJed Brown         ierr = ISGetSize(vs->isglobal.row[i],&Mi);CHKERRQ(ierr);
17570189643fSJed Brown         ierr = ISGetSize(vs->isglobal.col[j],&Ni);CHKERRQ(ierr);
17580189643fSJed Brown         ierr = ISGetLocalSize(vs->isglobal.row[i],&mi);CHKERRQ(ierr);
17590189643fSJed Brown         ierr = ISGetLocalSize(vs->isglobal.col[j],&ni);CHKERRQ(ierr);
1760ce94432eSBarry Smith         if (M != Mi || N != Ni) SETERRQ6(PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Global sizes (%D,%D) of nested submatrix (%D,%D) do not agree with space defined by index sets (%D,%D)",M,N,i,j,Mi,Ni);
1761ce94432eSBarry Smith         if (m != mi || n != ni) SETERRQ6(PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Local sizes (%D,%D) of nested submatrix (%D,%D) do not agree with space defined by index sets (%D,%D)",m,n,i,j,mi,ni);
17620189643fSJed Brown       }
17630189643fSJed Brown     }
176476bd3646SJed Brown   }
1765a061e289SJed Brown 
1766a061e289SJed Brown   /* Set A->assembled if all non-null blocks are currently assembled */
1767a061e289SJed Brown   for (i=0; i<vs->nr; i++) {
1768a061e289SJed Brown     for (j=0; j<vs->nc; j++) {
1769a061e289SJed Brown       if (vs->m[i][j] && !vs->m[i][j]->assembled) PetscFunctionReturn(0);
1770a061e289SJed Brown     }
1771a061e289SJed Brown   }
1772a061e289SJed Brown   A->assembled = PETSC_TRUE;
1773d8588912SDave May   PetscFunctionReturn(0);
1774d8588912SDave May }
1775d8588912SDave May 
177645c38901SJed Brown /*@C
1777659c6bb0SJed Brown    MatCreateNest - Creates a new matrix containing several nested submatrices, each stored separately
1778659c6bb0SJed Brown 
1779659c6bb0SJed Brown    Collective on Mat
1780659c6bb0SJed Brown 
1781659c6bb0SJed Brown    Input Parameter:
1782659c6bb0SJed Brown +  comm - Communicator for the new Mat
1783659c6bb0SJed Brown .  nr - number of nested row blocks
17840298fd71SBarry Smith .  is_row - index sets for each nested row block, or NULL to make contiguous
1785659c6bb0SJed Brown .  nc - number of nested column blocks
17860298fd71SBarry Smith .  is_col - index sets for each nested column block, or NULL to make contiguous
17870298fd71SBarry Smith -  a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL
1788659c6bb0SJed Brown 
1789659c6bb0SJed Brown    Output Parameter:
1790659c6bb0SJed Brown .  B - new matrix
1791659c6bb0SJed Brown 
1792659c6bb0SJed Brown    Level: advanced
1793659c6bb0SJed Brown 
179479798668SBarry Smith .seealso: MatCreate(), VecCreateNest(), DMCreateMatrix(), MATNEST, MatNestSetSubMat(),
179579798668SBarry Smith           MatNestGetSubMat(), MatNestGetLocalISs(), MatNestGetSize(),
179679798668SBarry Smith           MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats()
1797659c6bb0SJed Brown @*/
17987087cfbeSBarry Smith PetscErrorCode MatCreateNest(MPI_Comm comm,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[],Mat *B)
1799d8588912SDave May {
1800d8588912SDave May   Mat            A;
1801d8588912SDave May   PetscErrorCode ierr;
1802d8588912SDave May 
1803d8588912SDave May   PetscFunctionBegin;
1804f4259b30SLisandro Dalcin   *B   = NULL;
1805d8588912SDave May   ierr = MatCreate(comm,&A);CHKERRQ(ierr);
1806c8883902SJed Brown   ierr = MatSetType(A,MATNEST);CHKERRQ(ierr);
180791a28eb3SBarry Smith   A->preallocated = PETSC_TRUE;
1808c8883902SJed Brown   ierr = MatNestSetSubMats(A,nr,is_row,nc,is_col,a);CHKERRQ(ierr);
1809d8588912SDave May   *B   = A;
1810d8588912SDave May   PetscFunctionReturn(0);
1811d8588912SDave May }
1812659c6bb0SJed Brown 
1813*be705e3aSPierre Jolivet PetscErrorCode MatConvert_Nest_SeqAIJ_fast(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
1814b68353e5Sstefano_zampini {
1815b68353e5Sstefano_zampini   Mat_Nest       *nest = (Mat_Nest*)A->data;
181623875855Sstefano_zampini   Mat            *trans;
1817b68353e5Sstefano_zampini   PetscScalar    **avv;
1818b68353e5Sstefano_zampini   PetscScalar    *vv;
1819b68353e5Sstefano_zampini   PetscInt       **aii,**ajj;
1820b68353e5Sstefano_zampini   PetscInt       *ii,*jj,*ci;
1821b68353e5Sstefano_zampini   PetscInt       nr,nc,nnz,i,j;
1822b68353e5Sstefano_zampini   PetscBool      done;
1823b68353e5Sstefano_zampini   PetscErrorCode ierr;
1824b68353e5Sstefano_zampini 
1825b68353e5Sstefano_zampini   PetscFunctionBegin;
1826b68353e5Sstefano_zampini   ierr = MatGetSize(A,&nr,&nc);CHKERRQ(ierr);
1827b68353e5Sstefano_zampini   if (reuse == MAT_REUSE_MATRIX) {
1828b68353e5Sstefano_zampini     PetscInt rnr;
1829b68353e5Sstefano_zampini 
1830b68353e5Sstefano_zampini     ierr = MatGetRowIJ(*newmat,0,PETSC_FALSE,PETSC_FALSE,&rnr,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr);
1831b68353e5Sstefano_zampini     if (!done) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"MatGetRowIJ");
1832b68353e5Sstefano_zampini     if (rnr != nr) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of rows");
1833b68353e5Sstefano_zampini     ierr = MatSeqAIJGetArray(*newmat,&vv);CHKERRQ(ierr);
1834b68353e5Sstefano_zampini   }
1835b68353e5Sstefano_zampini   /* extract CSR for nested SeqAIJ matrices */
1836b68353e5Sstefano_zampini   nnz  = 0;
183723875855Sstefano_zampini   ierr = PetscCalloc4(nest->nr*nest->nc,&aii,nest->nr*nest->nc,&ajj,nest->nr*nest->nc,&avv,nest->nr*nest->nc,&trans);CHKERRQ(ierr);
1838b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1839b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1840b68353e5Sstefano_zampini       Mat B = nest->m[i][j];
1841b68353e5Sstefano_zampini       if (B) {
1842b68353e5Sstefano_zampini         PetscScalar *naa;
1843b68353e5Sstefano_zampini         PetscInt    *nii,*njj,nnr;
184423875855Sstefano_zampini         PetscBool   istrans;
1845b68353e5Sstefano_zampini 
184623875855Sstefano_zampini         ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans);CHKERRQ(ierr);
184723875855Sstefano_zampini         if (istrans) {
184823875855Sstefano_zampini           Mat Bt;
184923875855Sstefano_zampini 
185023875855Sstefano_zampini           ierr = MatTransposeGetMat(B,&Bt);CHKERRQ(ierr);
185123875855Sstefano_zampini           ierr = MatTranspose(Bt,MAT_INITIAL_MATRIX,&trans[i*nest->nc+j]);CHKERRQ(ierr);
185223875855Sstefano_zampini           B    = trans[i*nest->nc+j];
185323875855Sstefano_zampini         }
1854b68353e5Sstefano_zampini         ierr = MatGetRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&nii,(const PetscInt**)&njj,&done);CHKERRQ(ierr);
1855b68353e5Sstefano_zampini         if (!done) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatGetRowIJ");
1856b68353e5Sstefano_zampini         ierr = MatSeqAIJGetArray(B,&naa);CHKERRQ(ierr);
1857b68353e5Sstefano_zampini         nnz += nii[nnr];
1858b68353e5Sstefano_zampini 
1859b68353e5Sstefano_zampini         aii[i*nest->nc+j] = nii;
1860b68353e5Sstefano_zampini         ajj[i*nest->nc+j] = njj;
1861b68353e5Sstefano_zampini         avv[i*nest->nc+j] = naa;
1862b68353e5Sstefano_zampini       }
1863b68353e5Sstefano_zampini     }
1864b68353e5Sstefano_zampini   }
1865b68353e5Sstefano_zampini   if (reuse != MAT_REUSE_MATRIX) {
1866b68353e5Sstefano_zampini     ierr = PetscMalloc1(nr+1,&ii);CHKERRQ(ierr);
1867b68353e5Sstefano_zampini     ierr = PetscMalloc1(nnz,&jj);CHKERRQ(ierr);
1868b68353e5Sstefano_zampini     ierr = PetscMalloc1(nnz,&vv);CHKERRQ(ierr);
1869b68353e5Sstefano_zampini   } else {
1870b68353e5Sstefano_zampini     if (nnz != ii[nr]) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of nonzeros");
1871b68353e5Sstefano_zampini   }
1872b68353e5Sstefano_zampini 
1873b68353e5Sstefano_zampini   /* new row pointer */
1874580bdb30SBarry Smith   ierr = PetscArrayzero(ii,nr+1);CHKERRQ(ierr);
1875b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1876b68353e5Sstefano_zampini     PetscInt       ncr,rst;
1877b68353e5Sstefano_zampini 
1878b68353e5Sstefano_zampini     ierr = ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL);CHKERRQ(ierr);
1879b68353e5Sstefano_zampini     ierr = ISGetLocalSize(nest->isglobal.row[i],&ncr);CHKERRQ(ierr);
1880b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1881b68353e5Sstefano_zampini       if (aii[i*nest->nc+j]) {
1882b68353e5Sstefano_zampini         PetscInt    *nii = aii[i*nest->nc+j];
1883b68353e5Sstefano_zampini         PetscInt    ir;
1884b68353e5Sstefano_zampini 
1885b68353e5Sstefano_zampini         for (ir=rst; ir<ncr+rst; ++ir) {
1886b68353e5Sstefano_zampini           ii[ir+1] += nii[1]-nii[0];
1887b68353e5Sstefano_zampini           nii++;
1888b68353e5Sstefano_zampini         }
1889b68353e5Sstefano_zampini       }
1890b68353e5Sstefano_zampini     }
1891b68353e5Sstefano_zampini   }
1892b68353e5Sstefano_zampini   for (i=0; i<nr; i++) ii[i+1] += ii[i];
1893b68353e5Sstefano_zampini 
1894b68353e5Sstefano_zampini   /* construct CSR for the new matrix */
1895b68353e5Sstefano_zampini   ierr = PetscCalloc1(nr,&ci);CHKERRQ(ierr);
1896b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1897b68353e5Sstefano_zampini     PetscInt       ncr,rst;
1898b68353e5Sstefano_zampini 
1899b68353e5Sstefano_zampini     ierr = ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL);CHKERRQ(ierr);
1900b68353e5Sstefano_zampini     ierr = ISGetLocalSize(nest->isglobal.row[i],&ncr);CHKERRQ(ierr);
1901b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1902b68353e5Sstefano_zampini       if (aii[i*nest->nc+j]) {
1903b68353e5Sstefano_zampini         PetscScalar *nvv = avv[i*nest->nc+j];
1904b68353e5Sstefano_zampini         PetscInt    *nii = aii[i*nest->nc+j];
1905b68353e5Sstefano_zampini         PetscInt    *njj = ajj[i*nest->nc+j];
1906b68353e5Sstefano_zampini         PetscInt    ir,cst;
1907b68353e5Sstefano_zampini 
1908b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.col[j],&cst,NULL);CHKERRQ(ierr);
1909b68353e5Sstefano_zampini         for (ir=rst; ir<ncr+rst; ++ir) {
1910b68353e5Sstefano_zampini           PetscInt ij,rsize = nii[1]-nii[0],ist = ii[ir]+ci[ir];
1911b68353e5Sstefano_zampini 
1912b68353e5Sstefano_zampini           for (ij=0;ij<rsize;ij++) {
1913b68353e5Sstefano_zampini             jj[ist+ij] = *njj+cst;
1914b68353e5Sstefano_zampini             vv[ist+ij] = *nvv;
1915b68353e5Sstefano_zampini             njj++;
1916b68353e5Sstefano_zampini             nvv++;
1917b68353e5Sstefano_zampini           }
1918b68353e5Sstefano_zampini           ci[ir] += rsize;
1919b68353e5Sstefano_zampini           nii++;
1920b68353e5Sstefano_zampini         }
1921b68353e5Sstefano_zampini       }
1922b68353e5Sstefano_zampini     }
1923b68353e5Sstefano_zampini   }
1924b68353e5Sstefano_zampini   ierr = PetscFree(ci);CHKERRQ(ierr);
1925b68353e5Sstefano_zampini 
1926b68353e5Sstefano_zampini   /* restore info */
1927b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1928b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1929b68353e5Sstefano_zampini       Mat B = nest->m[i][j];
1930b68353e5Sstefano_zampini       if (B) {
1931b68353e5Sstefano_zampini         PetscInt nnr = 0, k = i*nest->nc+j;
193223875855Sstefano_zampini 
193323875855Sstefano_zampini         B    = (trans[k] ? trans[k] : B);
1934b68353e5Sstefano_zampini         ierr = MatRestoreRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&aii[k],(const PetscInt**)&ajj[k],&done);CHKERRQ(ierr);
1935b68353e5Sstefano_zampini         if (!done) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatRestoreRowIJ");
1936b68353e5Sstefano_zampini         ierr = MatSeqAIJRestoreArray(B,&avv[k]);CHKERRQ(ierr);
193723875855Sstefano_zampini         ierr = MatDestroy(&trans[k]);CHKERRQ(ierr);
1938b68353e5Sstefano_zampini       }
1939b68353e5Sstefano_zampini     }
1940b68353e5Sstefano_zampini   }
194123875855Sstefano_zampini   ierr = PetscFree4(aii,ajj,avv,trans);CHKERRQ(ierr);
1942b68353e5Sstefano_zampini 
1943b68353e5Sstefano_zampini   /* finalize newmat */
1944b68353e5Sstefano_zampini   if (reuse == MAT_INITIAL_MATRIX) {
1945b68353e5Sstefano_zampini     ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,newmat);CHKERRQ(ierr);
1946b68353e5Sstefano_zampini   } else if (reuse == MAT_INPLACE_MATRIX) {
1947b68353e5Sstefano_zampini     Mat B;
1948b68353e5Sstefano_zampini 
1949b68353e5Sstefano_zampini     ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,&B);CHKERRQ(ierr);
1950b68353e5Sstefano_zampini     ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr);
1951b68353e5Sstefano_zampini   }
1952b68353e5Sstefano_zampini   ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1953b68353e5Sstefano_zampini   ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1954b68353e5Sstefano_zampini   {
1955b68353e5Sstefano_zampini     Mat_SeqAIJ *a = (Mat_SeqAIJ*)((*newmat)->data);
1956b68353e5Sstefano_zampini     a->free_a     = PETSC_TRUE;
1957b68353e5Sstefano_zampini     a->free_ij    = PETSC_TRUE;
1958b68353e5Sstefano_zampini   }
1959b68353e5Sstefano_zampini   PetscFunctionReturn(0);
1960b68353e5Sstefano_zampini }
1961b68353e5Sstefano_zampini 
1962*be705e3aSPierre Jolivet PETSC_INTERN PetscErrorCode MatAXPY_Dense_Nest(Mat Y,PetscScalar a,Mat X)
1963*be705e3aSPierre Jolivet {
1964*be705e3aSPierre Jolivet   Mat_Nest       *nest = (Mat_Nest*)X->data;
1965*be705e3aSPierre Jolivet   PetscInt       i,j,k,rstart;
1966*be705e3aSPierre Jolivet   PetscBool      flg;
1967*be705e3aSPierre Jolivet   PetscErrorCode ierr;
1968*be705e3aSPierre Jolivet 
1969*be705e3aSPierre Jolivet   PetscFunctionBegin;
1970*be705e3aSPierre Jolivet   /* Fill by row */
1971*be705e3aSPierre Jolivet   for (j=0; j<nest->nc; ++j) {
1972*be705e3aSPierre Jolivet     /* Using global column indices and ISAllGather() is not scalable. */
1973*be705e3aSPierre Jolivet     IS             bNis;
1974*be705e3aSPierre Jolivet     PetscInt       bN;
1975*be705e3aSPierre Jolivet     const PetscInt *bNindices;
1976*be705e3aSPierre Jolivet     ierr = ISAllGather(nest->isglobal.col[j], &bNis);CHKERRQ(ierr);
1977*be705e3aSPierre Jolivet     ierr = ISGetSize(bNis,&bN);CHKERRQ(ierr);
1978*be705e3aSPierre Jolivet     ierr = ISGetIndices(bNis,&bNindices);CHKERRQ(ierr);
1979*be705e3aSPierre Jolivet     for (i=0; i<nest->nr; ++i) {
1980*be705e3aSPierre Jolivet       Mat            B,D=NULL;
1981*be705e3aSPierre Jolivet       PetscInt       bm, br;
1982*be705e3aSPierre Jolivet       const PetscInt *bmindices;
1983*be705e3aSPierre Jolivet       B = nest->m[i][j];
1984*be705e3aSPierre Jolivet       if (!B) continue;
1985*be705e3aSPierre Jolivet       ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&flg);CHKERRQ(ierr);
1986*be705e3aSPierre Jolivet       if (flg) {
1987*be705e3aSPierre Jolivet         ierr = PetscTryMethod(B,"MatTransposeGetMat_C",(Mat,Mat*),(B,&D));CHKERRQ(ierr);
1988*be705e3aSPierre Jolivet         ierr = PetscTryMethod(B,"MatHermitianTransposeGetMat_C",(Mat,Mat*),(B,&D));CHKERRQ(ierr);
1989*be705e3aSPierre Jolivet         ierr = MatConvert(B,((PetscObject)D)->type_name,MAT_INITIAL_MATRIX,&D);CHKERRQ(ierr);
1990*be705e3aSPierre Jolivet         B = D;
1991*be705e3aSPierre Jolivet       }
1992*be705e3aSPierre Jolivet       ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQSBAIJ,MATMPISBAIJ,"");CHKERRQ(ierr);
1993*be705e3aSPierre Jolivet       if (flg) {
1994*be705e3aSPierre Jolivet         if (D) {
1995*be705e3aSPierre Jolivet           ierr = MatConvert(D,MATBAIJ,MAT_INPLACE_MATRIX,&D);CHKERRQ(ierr);
1996*be705e3aSPierre Jolivet         } else {
1997*be705e3aSPierre Jolivet           ierr = MatConvert(B,MATBAIJ,MAT_INITIAL_MATRIX,&D);CHKERRQ(ierr);
1998*be705e3aSPierre Jolivet         }
1999*be705e3aSPierre Jolivet         B = D;
2000*be705e3aSPierre Jolivet       }
2001*be705e3aSPierre Jolivet       ierr = ISGetLocalSize(nest->isglobal.row[i],&bm);CHKERRQ(ierr);
2002*be705e3aSPierre Jolivet       ierr = ISGetIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2003*be705e3aSPierre Jolivet       ierr = MatGetOwnershipRange(B,&rstart,NULL);CHKERRQ(ierr);
2004*be705e3aSPierre Jolivet       for (br = 0; br < bm; ++br) {
2005*be705e3aSPierre Jolivet         PetscInt          row = bmindices[br], brncols, *cols;
2006*be705e3aSPierre Jolivet         const PetscInt    *brcols;
2007*be705e3aSPierre Jolivet         const PetscScalar *brcoldata;
2008*be705e3aSPierre Jolivet         PetscScalar       *vals = NULL;
2009*be705e3aSPierre Jolivet         ierr = MatGetRow(B,br+rstart,&brncols,&brcols,&brcoldata);CHKERRQ(ierr);
2010*be705e3aSPierre Jolivet         ierr = PetscMalloc1(brncols,&cols);CHKERRQ(ierr);
2011*be705e3aSPierre Jolivet         for (k=0; k<brncols; k++) cols[k] = bNindices[brcols[k]];
2012*be705e3aSPierre Jolivet         /*
2013*be705e3aSPierre Jolivet           Nest blocks are required to be nonoverlapping -- otherwise nest and monolithic index layouts wouldn't match.
2014*be705e3aSPierre Jolivet           Thus, we could use INSERT_VALUES, but I prefer ADD_VALUES.
2015*be705e3aSPierre Jolivet          */
2016*be705e3aSPierre Jolivet         if (a != 1.0) {
2017*be705e3aSPierre Jolivet           ierr = PetscMalloc1(brncols,&vals);CHKERRQ(ierr);
2018*be705e3aSPierre Jolivet           for (k=0; k<brncols; k++) vals[k] = a * brcoldata[k];
2019*be705e3aSPierre Jolivet           ierr = MatSetValues(Y,1,&row,brncols,cols,vals,ADD_VALUES);CHKERRQ(ierr);
2020*be705e3aSPierre Jolivet           ierr = PetscFree(vals);CHKERRQ(ierr);
2021*be705e3aSPierre Jolivet         } else {
2022*be705e3aSPierre Jolivet           ierr = MatSetValues(Y,1,&row,brncols,cols,brcoldata,ADD_VALUES);CHKERRQ(ierr);
2023*be705e3aSPierre Jolivet         }
2024*be705e3aSPierre Jolivet         ierr = MatRestoreRow(B,br+rstart,&brncols,&brcols,&brcoldata);CHKERRQ(ierr);
2025*be705e3aSPierre Jolivet         ierr = PetscFree(cols);CHKERRQ(ierr);
2026*be705e3aSPierre Jolivet       }
2027*be705e3aSPierre Jolivet       if (D) {
2028*be705e3aSPierre Jolivet         ierr = MatDestroy(&D);
2029*be705e3aSPierre Jolivet       }
2030*be705e3aSPierre Jolivet       ierr = ISRestoreIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2031*be705e3aSPierre Jolivet     }
2032*be705e3aSPierre Jolivet     ierr = ISRestoreIndices(bNis,&bNindices);CHKERRQ(ierr);
2033*be705e3aSPierre Jolivet     ierr = ISDestroy(&bNis);CHKERRQ(ierr);
2034*be705e3aSPierre Jolivet   }
2035*be705e3aSPierre Jolivet   ierr = MatAssemblyBegin(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2036*be705e3aSPierre Jolivet   ierr = MatAssemblyEnd(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2037*be705e3aSPierre Jolivet   PetscFunctionReturn(0);
2038*be705e3aSPierre Jolivet }
2039*be705e3aSPierre Jolivet 
2040*be705e3aSPierre Jolivet PetscErrorCode MatConvert_Nest_AIJ(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
2041629c3df2SDmitry Karpeev {
2042629c3df2SDmitry Karpeev   PetscErrorCode ierr;
2043629c3df2SDmitry Karpeev   Mat_Nest       *nest = (Mat_Nest*)A->data;
2044*be705e3aSPierre Jolivet   PetscInt       m,n,M,N,i,j,k,*dnnz,*onnz,rstart,cstart,cend;
2045b68353e5Sstefano_zampini   PetscMPIInt    size;
2046629c3df2SDmitry Karpeev   Mat            C;
2047629c3df2SDmitry Karpeev 
2048629c3df2SDmitry Karpeev   PetscFunctionBegin;
2049ffc4695bSBarry Smith   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&size);CHKERRMPI(ierr);
2050b68353e5Sstefano_zampini   if (size == 1) { /* look for a special case with SeqAIJ matrices and strided-1, contiguous, blocks */
2051b68353e5Sstefano_zampini     PetscInt  nf;
2052b68353e5Sstefano_zampini     PetscBool fast;
2053b68353e5Sstefano_zampini 
2054b68353e5Sstefano_zampini     ierr = PetscStrcmp(newtype,MATAIJ,&fast);CHKERRQ(ierr);
2055b68353e5Sstefano_zampini     if (!fast) {
2056b68353e5Sstefano_zampini       ierr = PetscStrcmp(newtype,MATSEQAIJ,&fast);CHKERRQ(ierr);
2057b68353e5Sstefano_zampini     }
2058b68353e5Sstefano_zampini     for (i=0; i<nest->nr && fast; ++i) {
2059b68353e5Sstefano_zampini       for (j=0; j<nest->nc && fast; ++j) {
2060b68353e5Sstefano_zampini         Mat B = nest->m[i][j];
2061b68353e5Sstefano_zampini         if (B) {
2062b68353e5Sstefano_zampini           ierr = PetscObjectTypeCompare((PetscObject)B,MATSEQAIJ,&fast);CHKERRQ(ierr);
206323875855Sstefano_zampini           if (!fast) {
206423875855Sstefano_zampini             PetscBool istrans;
206523875855Sstefano_zampini 
206623875855Sstefano_zampini             ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans);CHKERRQ(ierr);
206723875855Sstefano_zampini             if (istrans) {
206823875855Sstefano_zampini               Mat Bt;
206923875855Sstefano_zampini 
207023875855Sstefano_zampini               ierr = MatTransposeGetMat(B,&Bt);CHKERRQ(ierr);
207123875855Sstefano_zampini               ierr = PetscObjectTypeCompare((PetscObject)Bt,MATSEQAIJ,&fast);CHKERRQ(ierr);
207223875855Sstefano_zampini             }
2073b68353e5Sstefano_zampini           }
2074b68353e5Sstefano_zampini         }
2075b68353e5Sstefano_zampini       }
2076b68353e5Sstefano_zampini     }
2077b68353e5Sstefano_zampini     for (i=0, nf=0; i<nest->nr && fast; ++i) {
2078b68353e5Sstefano_zampini       ierr = PetscObjectTypeCompare((PetscObject)nest->isglobal.row[i],ISSTRIDE,&fast);CHKERRQ(ierr);
2079b68353e5Sstefano_zampini       if (fast) {
2080b68353e5Sstefano_zampini         PetscInt f,s;
2081b68353e5Sstefano_zampini 
2082b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.row[i],&f,&s);CHKERRQ(ierr);
2083b68353e5Sstefano_zampini         if (f != nf || s != 1) { fast = PETSC_FALSE; }
2084b68353e5Sstefano_zampini         else {
2085b68353e5Sstefano_zampini           ierr = ISGetSize(nest->isglobal.row[i],&f);CHKERRQ(ierr);
2086b68353e5Sstefano_zampini           nf  += f;
2087b68353e5Sstefano_zampini         }
2088b68353e5Sstefano_zampini       }
2089b68353e5Sstefano_zampini     }
2090b68353e5Sstefano_zampini     for (i=0, nf=0; i<nest->nc && fast; ++i) {
2091b68353e5Sstefano_zampini       ierr = PetscObjectTypeCompare((PetscObject)nest->isglobal.col[i],ISSTRIDE,&fast);CHKERRQ(ierr);
2092b68353e5Sstefano_zampini       if (fast) {
2093b68353e5Sstefano_zampini         PetscInt f,s;
2094b68353e5Sstefano_zampini 
2095b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.col[i],&f,&s);CHKERRQ(ierr);
2096b68353e5Sstefano_zampini         if (f != nf || s != 1) { fast = PETSC_FALSE; }
2097b68353e5Sstefano_zampini         else {
2098b68353e5Sstefano_zampini           ierr = ISGetSize(nest->isglobal.col[i],&f);CHKERRQ(ierr);
2099b68353e5Sstefano_zampini           nf  += f;
2100b68353e5Sstefano_zampini         }
2101b68353e5Sstefano_zampini       }
2102b68353e5Sstefano_zampini     }
2103b68353e5Sstefano_zampini     if (fast) {
2104b68353e5Sstefano_zampini       ierr = MatConvert_Nest_SeqAIJ_fast(A,newtype,reuse,newmat);CHKERRQ(ierr);
2105b68353e5Sstefano_zampini       PetscFunctionReturn(0);
2106b68353e5Sstefano_zampini     }
2107b68353e5Sstefano_zampini   }
2108629c3df2SDmitry Karpeev   ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr);
2109629c3df2SDmitry Karpeev   ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr);
2110649b366bSFande Kong   ierr = MatGetOwnershipRangeColumn(A,&cstart,&cend);CHKERRQ(ierr);
2111629c3df2SDmitry Karpeev   switch (reuse) {
2112629c3df2SDmitry Karpeev   case MAT_INITIAL_MATRIX:
2113ce94432eSBarry Smith     ierr    = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr);
2114629c3df2SDmitry Karpeev     ierr    = MatSetType(C,newtype);CHKERRQ(ierr);
2115629c3df2SDmitry Karpeev     ierr    = MatSetSizes(C,m,n,M,N);CHKERRQ(ierr);
2116629c3df2SDmitry Karpeev     *newmat = C;
2117629c3df2SDmitry Karpeev     break;
2118629c3df2SDmitry Karpeev   case MAT_REUSE_MATRIX:
2119629c3df2SDmitry Karpeev     C = *newmat;
2120629c3df2SDmitry Karpeev     break;
2121ce94432eSBarry Smith   default: SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MatReuse");
2122629c3df2SDmitry Karpeev   }
2123785e854fSJed Brown   ierr = PetscMalloc1(2*m,&dnnz);CHKERRQ(ierr);
2124629c3df2SDmitry Karpeev   onnz = dnnz + m;
2125629c3df2SDmitry Karpeev   for (k=0; k<m; k++) {
2126629c3df2SDmitry Karpeev     dnnz[k] = 0;
2127629c3df2SDmitry Karpeev     onnz[k] = 0;
2128629c3df2SDmitry Karpeev   }
2129629c3df2SDmitry Karpeev   for (j=0; j<nest->nc; ++j) {
2130629c3df2SDmitry Karpeev     IS             bNis;
2131629c3df2SDmitry Karpeev     PetscInt       bN;
2132629c3df2SDmitry Karpeev     const PetscInt *bNindices;
2133629c3df2SDmitry Karpeev     /* Using global column indices and ISAllGather() is not scalable. */
2134629c3df2SDmitry Karpeev     ierr = ISAllGather(nest->isglobal.col[j], &bNis);CHKERRQ(ierr);
2135629c3df2SDmitry Karpeev     ierr = ISGetSize(bNis, &bN);CHKERRQ(ierr);
2136629c3df2SDmitry Karpeev     ierr = ISGetIndices(bNis,&bNindices);CHKERRQ(ierr);
2137629c3df2SDmitry Karpeev     for (i=0; i<nest->nr; ++i) {
2138629c3df2SDmitry Karpeev       PetscSF        bmsf;
2139649b366bSFande Kong       PetscSFNode    *iremote;
2140629c3df2SDmitry Karpeev       Mat            B;
2141649b366bSFande Kong       PetscInt       bm, *sub_dnnz,*sub_onnz, br;
2142629c3df2SDmitry Karpeev       const PetscInt *bmindices;
2143629c3df2SDmitry Karpeev       B = nest->m[i][j];
2144629c3df2SDmitry Karpeev       if (!B) continue;
2145629c3df2SDmitry Karpeev       ierr = ISGetLocalSize(nest->isglobal.row[i],&bm);CHKERRQ(ierr);
2146629c3df2SDmitry Karpeev       ierr = ISGetIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2147ce94432eSBarry Smith       ierr = PetscSFCreate(PetscObjectComm((PetscObject)A), &bmsf);CHKERRQ(ierr);
2148649b366bSFande Kong       ierr = PetscMalloc1(bm,&iremote);CHKERRQ(ierr);
2149649b366bSFande Kong       ierr = PetscMalloc1(bm,&sub_dnnz);CHKERRQ(ierr);
2150649b366bSFande Kong       ierr = PetscMalloc1(bm,&sub_onnz);CHKERRQ(ierr);
2151649b366bSFande Kong       for (k = 0; k < bm; ++k){
2152649b366bSFande Kong         sub_dnnz[k] = 0;
2153649b366bSFande Kong         sub_onnz[k] = 0;
2154649b366bSFande Kong       }
2155629c3df2SDmitry Karpeev       /*
2156629c3df2SDmitry Karpeev        Locate the owners for all of the locally-owned global row indices for this row block.
2157629c3df2SDmitry Karpeev        These determine the roots of PetscSF used to communicate preallocation data to row owners.
2158629c3df2SDmitry Karpeev        The roots correspond to the dnnz and onnz entries; thus, there are two roots per row.
2159629c3df2SDmitry Karpeev        */
216083b1a929SMark Adams       ierr = MatGetOwnershipRange(B,&rstart,NULL);CHKERRQ(ierr);
2161629c3df2SDmitry Karpeev       for (br = 0; br < bm; ++br) {
2162131c27b5Sprj-         PetscInt       row = bmindices[br], brncols, col;
2163629c3df2SDmitry Karpeev         const PetscInt *brcols;
2164a4b3d3acSMatthew G Knepley         PetscInt       rowrel = 0; /* row's relative index on its owner rank */
2165131c27b5Sprj-         PetscMPIInt    rowowner = 0;
2166629c3df2SDmitry Karpeev         ierr      = PetscLayoutFindOwnerIndex(A->rmap,row,&rowowner,&rowrel);CHKERRQ(ierr);
2167649b366bSFande Kong         /* how many roots  */
2168649b366bSFande Kong         iremote[br].rank = rowowner; iremote[br].index = rowrel;           /* edge from bmdnnz to dnnz */
2169649b366bSFande Kong         /* get nonzero pattern */
217083b1a929SMark Adams         ierr = MatGetRow(B,br+rstart,&brncols,&brcols,NULL);CHKERRQ(ierr);
2171629c3df2SDmitry Karpeev         for (k=0; k<brncols; k++) {
2172629c3df2SDmitry Karpeev           col  = bNindices[brcols[k]];
2173649b366bSFande Kong           if (col>=A->cmap->range[rowowner] && col<A->cmap->range[rowowner+1]) {
2174649b366bSFande Kong             sub_dnnz[br]++;
2175649b366bSFande Kong           } else {
2176649b366bSFande Kong             sub_onnz[br]++;
2177649b366bSFande Kong           }
2178629c3df2SDmitry Karpeev         }
217983b1a929SMark Adams         ierr = MatRestoreRow(B,br+rstart,&brncols,&brcols,NULL);CHKERRQ(ierr);
2180629c3df2SDmitry Karpeev       }
2181629c3df2SDmitry Karpeev       ierr = ISRestoreIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2182629c3df2SDmitry Karpeev       /* bsf will have to take care of disposing of bedges. */
2183649b366bSFande Kong       ierr = PetscSFSetGraph(bmsf,m,bm,NULL,PETSC_OWN_POINTER,iremote,PETSC_OWN_POINTER);CHKERRQ(ierr);
2184649b366bSFande Kong       ierr = PetscSFReduceBegin(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM);CHKERRQ(ierr);
2185649b366bSFande Kong       ierr = PetscSFReduceEnd(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM);CHKERRQ(ierr);
2186649b366bSFande Kong       ierr = PetscSFReduceBegin(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM);CHKERRQ(ierr);
2187649b366bSFande Kong       ierr = PetscSFReduceEnd(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM);CHKERRQ(ierr);
2188649b366bSFande Kong       ierr = PetscFree(sub_dnnz);CHKERRQ(ierr);
2189649b366bSFande Kong       ierr = PetscFree(sub_onnz);CHKERRQ(ierr);
2190629c3df2SDmitry Karpeev       ierr = PetscSFDestroy(&bmsf);CHKERRQ(ierr);
2191629c3df2SDmitry Karpeev     }
219222d28d08SBarry Smith     ierr = ISRestoreIndices(bNis,&bNindices);CHKERRQ(ierr);
2193629c3df2SDmitry Karpeev     ierr = ISDestroy(&bNis);CHKERRQ(ierr);
219465a4a0a3Sstefano_zampini   }
219565a4a0a3Sstefano_zampini   /* Resize preallocation if overestimated */
219665a4a0a3Sstefano_zampini   for (i=0;i<m;i++) {
219765a4a0a3Sstefano_zampini     dnnz[i] = PetscMin(dnnz[i],A->cmap->n);
219865a4a0a3Sstefano_zampini     onnz[i] = PetscMin(onnz[i],A->cmap->N - A->cmap->n);
2199629c3df2SDmitry Karpeev   }
2200629c3df2SDmitry Karpeev   ierr = MatSeqAIJSetPreallocation(C,0,dnnz);CHKERRQ(ierr);
2201629c3df2SDmitry Karpeev   ierr = MatMPIAIJSetPreallocation(C,0,dnnz,0,onnz);CHKERRQ(ierr);
2202629c3df2SDmitry Karpeev   ierr = PetscFree(dnnz);CHKERRQ(ierr);
2203*be705e3aSPierre Jolivet   ierr = MatAXPY_Dense_Nest(C,1.0,A);CHKERRQ(ierr);
2204*be705e3aSPierre Jolivet   PetscFunctionReturn(0);
2205*be705e3aSPierre Jolivet }
2206629c3df2SDmitry Karpeev 
2207*be705e3aSPierre Jolivet PetscErrorCode MatConvert_Nest_Dense(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
2208*be705e3aSPierre Jolivet {
2209629c3df2SDmitry Karpeev   Mat            B;
2210*be705e3aSPierre Jolivet   PetscInt       m,n,M,N;
2211*be705e3aSPierre Jolivet   PetscErrorCode ierr;
2212*be705e3aSPierre Jolivet 
2213*be705e3aSPierre Jolivet   PetscFunctionBegin;
2214*be705e3aSPierre Jolivet   ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr);
2215*be705e3aSPierre Jolivet   ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr);
2216*be705e3aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
2217*be705e3aSPierre Jolivet     B = *newmat;
2218*be705e3aSPierre Jolivet     ierr = MatZeroEntries(B);CHKERRQ(ierr);
2219*be705e3aSPierre Jolivet   } else {
2220*be705e3aSPierre Jolivet     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),m,PETSC_DECIDE,M,N,NULL,&B);CHKERRQ(ierr);
2221629c3df2SDmitry Karpeev   }
2222*be705e3aSPierre Jolivet   ierr = MatAXPY_Dense_Nest(B,1.0,A);CHKERRQ(ierr);
2223*be705e3aSPierre Jolivet   if (reuse == MAT_INPLACE_MATRIX) {
2224*be705e3aSPierre Jolivet     ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr);
2225*be705e3aSPierre Jolivet   } else if (reuse == MAT_INITIAL_MATRIX) *newmat = B;
2226629c3df2SDmitry Karpeev   PetscFunctionReturn(0);
2227629c3df2SDmitry Karpeev }
2228629c3df2SDmitry Karpeev 
22298b7d3b4bSBarry Smith PetscErrorCode MatHasOperation_Nest(Mat mat,MatOperation op,PetscBool *has)
22308b7d3b4bSBarry Smith {
22318b7d3b4bSBarry Smith   Mat_Nest       *bA = (Mat_Nest*)mat->data;
22323c6db4c4SPierre Jolivet   MatOperation   opAdd;
22338b7d3b4bSBarry Smith   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
22348b7d3b4bSBarry Smith   PetscBool      flg;
223552c5f739Sprj-   PetscErrorCode ierr;
223652c5f739Sprj-   PetscFunctionBegin;
22378b7d3b4bSBarry Smith 
223852c5f739Sprj-   *has = PETSC_FALSE;
22393c6db4c4SPierre Jolivet   if (op == MATOP_MULT || op == MATOP_MULT_ADD || op == MATOP_MULT_TRANSPOSE || op == MATOP_MULT_TRANSPOSE_ADD) {
22403c6db4c4SPierre Jolivet     opAdd = (op == MATOP_MULT || op == MATOP_MULT_ADD ? MATOP_MULT_ADD : MATOP_MULT_TRANSPOSE_ADD);
22418b7d3b4bSBarry Smith     for (j=0; j<nc; j++) {
22428b7d3b4bSBarry Smith       for (i=0; i<nr; i++) {
22438b7d3b4bSBarry Smith         if (!bA->m[i][j]) continue;
22443c6db4c4SPierre Jolivet         ierr = MatHasOperation(bA->m[i][j],opAdd,&flg);CHKERRQ(ierr);
22458b7d3b4bSBarry Smith         if (!flg) PetscFunctionReturn(0);
22468b7d3b4bSBarry Smith       }
22478b7d3b4bSBarry Smith     }
22488b7d3b4bSBarry Smith   }
22493c6db4c4SPierre Jolivet   if (((void**)mat->ops)[op]) *has = PETSC_TRUE;
22508b7d3b4bSBarry Smith   PetscFunctionReturn(0);
22518b7d3b4bSBarry Smith }
22528b7d3b4bSBarry Smith 
2253659c6bb0SJed Brown /*MC
2254659c6bb0SJed Brown   MATNEST - MATNEST = "nest" - Matrix type consisting of nested submatrices, each stored separately.
2255659c6bb0SJed Brown 
2256659c6bb0SJed Brown   Level: intermediate
2257659c6bb0SJed Brown 
2258659c6bb0SJed Brown   Notes:
2259659c6bb0SJed Brown   This matrix type permits scalable use of PCFieldSplit and avoids the large memory costs of extracting submatrices.
2260659c6bb0SJed Brown   It allows the use of symmetric and block formats for parts of multi-physics simulations.
  It is usually used with DMComposite and DMCreateMatrix().
2262659c6bb0SJed Brown 
  Each of the submatrices lives on the same MPI communicator as the original nest matrix (though they can have zero
  rows/columns on some processes). Thus this is not meant for cases where the submatrices live on far fewer processes
  than the nest matrix.
22668b7d3b4bSBarry Smith 
226779798668SBarry Smith .seealso: MatCreate(), MatType, MatCreateNest(), MatNestSetSubMat(), MatNestGetSubMat(),
226879798668SBarry Smith           VecCreateNest(), DMCreateMatrix(), DMCOMPOSITE, MatNestSetVecType(), MatNestGetLocalISs(),
226979798668SBarry Smith           MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats()
2270659c6bb0SJed Brown M*/
22718cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_Nest(Mat A)
2272c8883902SJed Brown {
2273c8883902SJed Brown   Mat_Nest       *s;
2274c8883902SJed Brown   PetscErrorCode ierr;
2275c8883902SJed Brown 
2276c8883902SJed Brown   PetscFunctionBegin;
2277b00a9115SJed Brown   ierr    = PetscNewLog(A,&s);CHKERRQ(ierr);
2278c8883902SJed Brown   A->data = (void*)s;
2279e7c19651SJed Brown 
2280e7c19651SJed Brown   s->nr            = -1;
2281e7c19651SJed Brown   s->nc            = -1;
22820298fd71SBarry Smith   s->m             = NULL;
2283e7c19651SJed Brown   s->splitassembly = PETSC_FALSE;
2284c8883902SJed Brown 
2285c8883902SJed Brown   ierr = PetscMemzero(A->ops,sizeof(*A->ops));CHKERRQ(ierr);
228626fbe8dcSKarl Rupp 
2287c8883902SJed Brown   A->ops->mult                  = MatMult_Nest;
22889194d70fSJed Brown   A->ops->multadd               = MatMultAdd_Nest;
2289c8883902SJed Brown   A->ops->multtranspose         = MatMultTranspose_Nest;
22909194d70fSJed Brown   A->ops->multtransposeadd      = MatMultTransposeAdd_Nest;
2291f8170845SAlex Fikl   A->ops->transpose             = MatTranspose_Nest;
2292c8883902SJed Brown   A->ops->assemblybegin         = MatAssemblyBegin_Nest;
2293c8883902SJed Brown   A->ops->assemblyend           = MatAssemblyEnd_Nest;
2294c8883902SJed Brown   A->ops->zeroentries           = MatZeroEntries_Nest;
2295c222c20dSDavid Ham   A->ops->copy                  = MatCopy_Nest;
22966e76ffeaSPierre Jolivet   A->ops->axpy                  = MatAXPY_Nest;
2297c8883902SJed Brown   A->ops->duplicate             = MatDuplicate_Nest;
22987dae84e0SHong Zhang   A->ops->createsubmatrix       = MatCreateSubMatrix_Nest;
2299c8883902SJed Brown   A->ops->destroy               = MatDestroy_Nest;
2300c8883902SJed Brown   A->ops->view                  = MatView_Nest;
2301f4259b30SLisandro Dalcin   A->ops->getvecs               = NULL; /* Use VECNEST by calling MatNestSetVecType(A,VECNEST) */
2302c8883902SJed Brown   A->ops->getlocalsubmatrix     = MatGetLocalSubMatrix_Nest;
2303c8883902SJed Brown   A->ops->restorelocalsubmatrix = MatRestoreLocalSubMatrix_Nest;
2304429bac76SJed Brown   A->ops->getdiagonal           = MatGetDiagonal_Nest;
2305429bac76SJed Brown   A->ops->diagonalscale         = MatDiagonalScale_Nest;
2306a061e289SJed Brown   A->ops->scale                 = MatScale_Nest;
2307a061e289SJed Brown   A->ops->shift                 = MatShift_Nest;
230813135bc6SAlex Fikl   A->ops->diagonalset           = MatDiagonalSet_Nest;
2309f8170845SAlex Fikl   A->ops->setrandom             = MatSetRandom_Nest;
23108b7d3b4bSBarry Smith   A->ops->hasoperation          = MatHasOperation_Nest;
2311381b8e50SStefano Zampini   A->ops->missingdiagonal       = MatMissingDiagonal_Nest;
2312c8883902SJed Brown 
2313f4259b30SLisandro Dalcin   A->spptr        = NULL;
2314c8883902SJed Brown   A->assembled    = PETSC_FALSE;
2315c8883902SJed Brown 
2316c8883902SJed Brown   /* expose Nest api's */
2317bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",        MatNestGetSubMat_Nest);CHKERRQ(ierr);
2318bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",        MatNestSetSubMat_Nest);CHKERRQ(ierr);
2319bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",       MatNestGetSubMats_Nest);CHKERRQ(ierr);
2320bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",          MatNestGetSize_Nest);CHKERRQ(ierr);
2321bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",           MatNestGetISs_Nest);CHKERRQ(ierr);
2322bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",      MatNestGetLocalISs_Nest);CHKERRQ(ierr);
2323bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",       MatNestSetVecType_Nest);CHKERRQ(ierr);
2324bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",       MatNestSetSubMats_Nest);CHKERRQ(ierr);
23250899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",  MatConvert_Nest_AIJ);CHKERRQ(ierr);
23260899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",  MatConvert_Nest_AIJ);CHKERRQ(ierr);
232783b1a929SMark Adams   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",     MatConvert_Nest_AIJ);CHKERRQ(ierr);
23285e3038f0Sstefano_zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",      MatConvert_Nest_IS);CHKERRQ(ierr);
2329*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpidense_C",MatConvert_Nest_Dense);CHKERRQ(ierr);
2330*be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqdense_C",MatConvert_Nest_Dense);CHKERRQ(ierr);
23314222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_seqdense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr);
23324222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_mpidense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr);
23334222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_dense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr);
2334c8883902SJed Brown 
2335c8883902SJed Brown   ierr = PetscObjectChangeTypeName((PetscObject)A,MATNEST);CHKERRQ(ierr);
2336c8883902SJed Brown   PetscFunctionReturn(0);
2337c8883902SJed Brown }
2338