xref: /petsc/src/mat/impls/nest/matnest.c (revision 0572eedc5607f0f5c0c0a7fff7b7d10242b3a0fe)
1aaa7dc30SBarry Smith #include <../src/mat/impls/nest/matnestimpl.h> /*I   "petscmat.h"   I*/
2b68353e5Sstefano_zampini #include <../src/mat/impls/aij/seq/aij.h>
30c312b8eSJed Brown #include <petscsf.h>
4d8588912SDave May 
5c8883902SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat,PetscInt,const IS[],PetscInt,const IS[]);
606a1af2fSStefano Zampini static PetscErrorCode MatCreateVecs_Nest(Mat,Vec*,Vec*);
706a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat);
806a1af2fSStefano Zampini 
95e3038f0Sstefano_zampini PETSC_INTERN PetscErrorCode MatConvert_Nest_IS(Mat,MatType,MatReuse,Mat*);
10c8883902SJed Brown 
11d8588912SDave May /* private functions */
128188e55aSJed Brown static PetscErrorCode MatNestGetSizes_Private(Mat A,PetscInt *m,PetscInt *n,PetscInt *M,PetscInt *N)
13d8588912SDave May {
14d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
158188e55aSJed Brown   PetscInt       i,j;
16d8588912SDave May   PetscErrorCode ierr;
17d8588912SDave May 
18d8588912SDave May   PetscFunctionBegin;
198188e55aSJed Brown   *m = *n = *M = *N = 0;
208188e55aSJed Brown   for (i=0; i<bA->nr; i++) {  /* rows */
218188e55aSJed Brown     PetscInt sm,sM;
228188e55aSJed Brown     ierr = ISGetLocalSize(bA->isglobal.row[i],&sm);CHKERRQ(ierr);
238188e55aSJed Brown     ierr = ISGetSize(bA->isglobal.row[i],&sM);CHKERRQ(ierr);
248188e55aSJed Brown     *m  += sm;
258188e55aSJed Brown     *M  += sM;
26d8588912SDave May   }
278188e55aSJed Brown   for (j=0; j<bA->nc; j++) {  /* cols */
288188e55aSJed Brown     PetscInt sn,sN;
298188e55aSJed Brown     ierr = ISGetLocalSize(bA->isglobal.col[j],&sn);CHKERRQ(ierr);
308188e55aSJed Brown     ierr = ISGetSize(bA->isglobal.col[j],&sN);CHKERRQ(ierr);
318188e55aSJed Brown     *n  += sn;
328188e55aSJed Brown     *N  += sN;
33d8588912SDave May   }
34d8588912SDave May   PetscFunctionReturn(0);
35d8588912SDave May }
36d8588912SDave May 
37d8588912SDave May /* operations */
38207556f9SJed Brown static PetscErrorCode MatMult_Nest(Mat A,Vec x,Vec y)
39d8588912SDave May {
40d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
41207556f9SJed Brown   Vec            *bx = bA->right,*by = bA->left;
42207556f9SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
43d8588912SDave May   PetscErrorCode ierr;
44d8588912SDave May 
45d8588912SDave May   PetscFunctionBegin;
46207556f9SJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(y,bA->isglobal.row[i],&by[i]);CHKERRQ(ierr);}
47207556f9SJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
48207556f9SJed Brown   for (i=0; i<nr; i++) {
49d8588912SDave May     ierr = VecZeroEntries(by[i]);CHKERRQ(ierr);
50207556f9SJed Brown     for (j=0; j<nc; j++) {
51207556f9SJed Brown       if (!bA->m[i][j]) continue;
52d8588912SDave May       /* y[i] <- y[i] + A[i][j] * x[j] */
53d8588912SDave May       ierr = MatMultAdd(bA->m[i][j],bx[j],by[i],by[i]);CHKERRQ(ierr);
54d8588912SDave May     }
55d8588912SDave May   }
56207556f9SJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(y,bA->isglobal.row[i],&by[i]);CHKERRQ(ierr);}
57207556f9SJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
58d8588912SDave May   PetscFunctionReturn(0);
59d8588912SDave May }
60d8588912SDave May 
619194d70fSJed Brown static PetscErrorCode MatMultAdd_Nest(Mat A,Vec x,Vec y,Vec z)
629194d70fSJed Brown {
639194d70fSJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
649194d70fSJed Brown   Vec            *bx = bA->right,*bz = bA->left;
659194d70fSJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
669194d70fSJed Brown   PetscErrorCode ierr;
679194d70fSJed Brown 
689194d70fSJed Brown   PetscFunctionBegin;
699194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(z,bA->isglobal.row[i],&bz[i]);CHKERRQ(ierr);}
709194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
719194d70fSJed Brown   for (i=0; i<nr; i++) {
729194d70fSJed Brown     if (y != z) {
739194d70fSJed Brown       Vec by;
749194d70fSJed Brown       ierr = VecGetSubVector(y,bA->isglobal.row[i],&by);CHKERRQ(ierr);
759194d70fSJed Brown       ierr = VecCopy(by,bz[i]);CHKERRQ(ierr);
76336d21e7SJed Brown       ierr = VecRestoreSubVector(y,bA->isglobal.row[i],&by);CHKERRQ(ierr);
779194d70fSJed Brown     }
789194d70fSJed Brown     for (j=0; j<nc; j++) {
799194d70fSJed Brown       if (!bA->m[i][j]) continue;
809194d70fSJed Brown       /* y[i] <- y[i] + A[i][j] * x[j] */
819194d70fSJed Brown       ierr = MatMultAdd(bA->m[i][j],bx[j],bz[i],bz[i]);CHKERRQ(ierr);
829194d70fSJed Brown     }
839194d70fSJed Brown   }
849194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(z,bA->isglobal.row[i],&bz[i]);CHKERRQ(ierr);}
859194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
869194d70fSJed Brown   PetscFunctionReturn(0);
879194d70fSJed Brown }
889194d70fSJed Brown 
8952c5f739Sprj- typedef struct {
9052c5f739Sprj-   Mat          *workC;    /* array of Mat with specific containers depending on the underlying MatMatMult implementation */
9152c5f739Sprj-   PetscScalar  *tarray;   /* buffer for storing all temporary products A[i][j] B[j] */
9252c5f739Sprj-   PetscInt     *dm,*dn,k; /* displacements and number of submatrices */
9352c5f739Sprj- } Nest_Dense;
9452c5f739Sprj- 
956718818eSStefano Zampini PETSC_INTERN PetscErrorCode MatProductNumeric_Nest_Dense(Mat C)
9652c5f739Sprj- {
976718818eSStefano Zampini   Mat_Nest          *bA;
9852c5f739Sprj-   Nest_Dense        *contents;
996718818eSStefano Zampini   Mat               viewB,viewC,productB,workC;
10052c5f739Sprj-   const PetscScalar *barray;
10152c5f739Sprj-   PetscScalar       *carray;
1026718818eSStefano Zampini   PetscInt          i,j,M,N,nr,nc,ldb,ldc;
10352c5f739Sprj-   PetscErrorCode    ierr;
1046718818eSStefano Zampini   Mat               A,B;
10552c5f739Sprj- 
10652c5f739Sprj-   PetscFunctionBegin;
1076718818eSStefano Zampini   MatCheckProduct(C,3);
1086718818eSStefano Zampini   A    = C->product->A;
1096718818eSStefano Zampini   B    = C->product->B;
1106718818eSStefano Zampini   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
1116718818eSStefano Zampini   if (!N) {
1126718818eSStefano Zampini     ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1136718818eSStefano Zampini     ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1146718818eSStefano Zampini     PetscFunctionReturn(0);
1156718818eSStefano Zampini   }
1166718818eSStefano Zampini   contents = (Nest_Dense*)C->product->data;
1176718818eSStefano Zampini   if (!contents) SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Product data empty");
1186718818eSStefano Zampini   bA   = (Mat_Nest*)A->data;
1196718818eSStefano Zampini   nr   = bA->nr;
1206718818eSStefano Zampini   nc   = bA->nc;
12152c5f739Sprj-   ierr = MatDenseGetLDA(B,&ldb);CHKERRQ(ierr);
12252c5f739Sprj-   ierr = MatDenseGetLDA(C,&ldc);CHKERRQ(ierr);
12352c5f739Sprj-   ierr = MatZeroEntries(C);CHKERRQ(ierr);
12452c5f739Sprj-   ierr = MatDenseGetArrayRead(B,&barray);CHKERRQ(ierr);
1256718818eSStefano Zampini   ierr = MatDenseGetArrayWrite(C,&carray);CHKERRQ(ierr);
12652c5f739Sprj-   for (i=0; i<nr; i++) {
12752c5f739Sprj-     ierr = ISGetSize(bA->isglobal.row[i],&M);CHKERRQ(ierr);
12852c5f739Sprj-     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dm[i+1]-contents->dm[i],PETSC_DECIDE,M,N,carray+contents->dm[i],&viewC);CHKERRQ(ierr);
1296718818eSStefano Zampini     ierr = MatDenseSetLDA(viewC,ldc);CHKERRQ(ierr);
13052c5f739Sprj-     for (j=0; j<nc; j++) {
13152c5f739Sprj-       if (!bA->m[i][j]) continue;
13252c5f739Sprj-       ierr = ISGetSize(bA->isglobal.col[j],&M);CHKERRQ(ierr);
13352c5f739Sprj-       ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB);CHKERRQ(ierr);
1346718818eSStefano Zampini       ierr = MatDenseSetLDA(viewB,ldb);CHKERRQ(ierr);
1354222ddf1SHong Zhang 
1364222ddf1SHong Zhang       /* MatMatMultNumeric(bA->m[i][j],viewB,contents->workC[i*nc + j]); */
1374222ddf1SHong Zhang       workC             = contents->workC[i*nc + j];
1384222ddf1SHong Zhang       productB          = workC->product->B;
1394222ddf1SHong Zhang       workC->product->B = viewB; /* use newly created dense matrix viewB */
1406718818eSStefano Zampini       ierr = MatProductNumeric(workC);CHKERRQ(ierr);
14152c5f739Sprj-       ierr = MatDestroy(&viewB);CHKERRQ(ierr);
1424222ddf1SHong Zhang       workC->product->B = productB; /* resume original B */
1434222ddf1SHong Zhang 
14452c5f739Sprj-       /* C[i] <- workC + C[i] */
14552c5f739Sprj-       ierr = MatAXPY(viewC,1.0,contents->workC[i*nc + j],SAME_NONZERO_PATTERN);CHKERRQ(ierr);
14652c5f739Sprj-     }
14752c5f739Sprj-     ierr = MatDestroy(&viewC);CHKERRQ(ierr);
14852c5f739Sprj-   }
1496718818eSStefano Zampini   ierr = MatDenseRestoreArrayWrite(C,&carray);CHKERRQ(ierr);
15052c5f739Sprj-   ierr = MatDenseRestoreArrayRead(B,&barray);CHKERRQ(ierr);
1514222ddf1SHong Zhang 
1524222ddf1SHong Zhang   ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1534222ddf1SHong Zhang   ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15452c5f739Sprj-   PetscFunctionReturn(0);
15552c5f739Sprj- }
15652c5f739Sprj- 
15752c5f739Sprj- PetscErrorCode MatNest_DenseDestroy(void *ctx)
15852c5f739Sprj- {
15952c5f739Sprj-   Nest_Dense     *contents = (Nest_Dense*)ctx;
16052c5f739Sprj-   PetscInt       i;
16152c5f739Sprj-   PetscErrorCode ierr;
16252c5f739Sprj- 
16352c5f739Sprj-   PetscFunctionBegin;
16452c5f739Sprj-   ierr = PetscFree(contents->tarray);CHKERRQ(ierr);
16552c5f739Sprj-   for (i=0; i<contents->k; i++) {
16652c5f739Sprj-     ierr = MatDestroy(contents->workC + i);CHKERRQ(ierr);
16752c5f739Sprj-   }
16852c5f739Sprj-   ierr = PetscFree3(contents->dm,contents->dn,contents->workC);CHKERRQ(ierr);
16952c5f739Sprj-   ierr = PetscFree(contents);CHKERRQ(ierr);
17052c5f739Sprj-   PetscFunctionReturn(0);
17152c5f739Sprj- }
17252c5f739Sprj- 
1736718818eSStefano Zampini PETSC_INTERN PetscErrorCode MatProductSymbolic_Nest_Dense(Mat C)
17452c5f739Sprj- {
1756718818eSStefano Zampini   Mat_Nest          *bA;
1766718818eSStefano Zampini   Mat               viewB,workC;
17752c5f739Sprj-   const PetscScalar *barray;
1786718818eSStefano Zampini   PetscInt          i,j,M,N,m,n,nr,nc,maxm = 0,ldb;
1794222ddf1SHong Zhang   Nest_Dense        *contents=NULL;
1806718818eSStefano Zampini   PetscBool         cisdense;
18152c5f739Sprj-   PetscErrorCode    ierr;
1826718818eSStefano Zampini   Mat               A,B;
1836718818eSStefano Zampini   PetscReal         fill;
18452c5f739Sprj- 
18552c5f739Sprj-   PetscFunctionBegin;
1866718818eSStefano Zampini   MatCheckProduct(C,4);
1876718818eSStefano Zampini   if (C->product->data) SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Product data not empty");
1886718818eSStefano Zampini   A    = C->product->A;
1896718818eSStefano Zampini   B    = C->product->B;
1906718818eSStefano Zampini   fill = C->product->fill;
1916718818eSStefano Zampini   bA   = (Mat_Nest*)A->data;
1926718818eSStefano Zampini   nr   = bA->nr;
1936718818eSStefano Zampini   nc   = bA->nc;
194*0572eedcSPierre Jolivet   ierr = MatGetLocalSize(C,&m,&n);CHKERRQ(ierr);
195*0572eedcSPierre Jolivet   ierr = MatGetSize(C,&M,&N);CHKERRQ(ierr);
196*0572eedcSPierre Jolivet   if (m == PETSC_DECIDE || n == PETSC_DECIDE || M == PETSC_DECIDE || N == PETSC_DECIDE) {
1976718818eSStefano Zampini     ierr = MatGetLocalSize(B,NULL,&n);CHKERRQ(ierr);
19852c5f739Sprj-     ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
19952c5f739Sprj-     ierr = MatGetLocalSize(A,&m,NULL);CHKERRQ(ierr);
20052c5f739Sprj-     ierr = MatGetSize(A,&M,NULL);CHKERRQ(ierr);
2016718818eSStefano Zampini     ierr = MatSetSizes(C,m,n,M,N);CHKERRQ(ierr);
202*0572eedcSPierre Jolivet   }
2036718818eSStefano Zampini   ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATMPIDENSE,MATSEQDENSECUDA,MATMPIDENSECUDA,"");CHKERRQ(ierr);
2046718818eSStefano Zampini   if (!cisdense) {
2056718818eSStefano Zampini     ierr = MatSetType(C,((PetscObject)B)->type_name);CHKERRQ(ierr);
2066718818eSStefano Zampini   }
20718992e5dSStefano Zampini   ierr = MatSetUp(C);CHKERRQ(ierr);
2086718818eSStefano Zampini   if (!N) {
2096718818eSStefano Zampini     C->ops->productnumeric = MatProductNumeric_Nest_Dense;
2106718818eSStefano Zampini     PetscFunctionReturn(0);
21152c5f739Sprj-   }
21252c5f739Sprj- 
21352c5f739Sprj-   ierr = PetscNew(&contents);CHKERRQ(ierr);
2146718818eSStefano Zampini   C->product->data = contents;
2156718818eSStefano Zampini   C->product->destroy = MatNest_DenseDestroy;
21652c5f739Sprj-   ierr = PetscCalloc3(nr+1,&contents->dm,nc+1,&contents->dn,nr*nc,&contents->workC);CHKERRQ(ierr);
21752c5f739Sprj-   contents->k = nr*nc;
21852c5f739Sprj-   for (i=0; i<nr; i++) {
21952c5f739Sprj-     ierr = ISGetLocalSize(bA->isglobal.row[i],contents->dm + i+1);CHKERRQ(ierr);
22052c5f739Sprj-     maxm = PetscMax(maxm,contents->dm[i+1]);
22152c5f739Sprj-     contents->dm[i+1] += contents->dm[i];
22252c5f739Sprj-   }
22352c5f739Sprj-   for (i=0; i<nc; i++) {
22452c5f739Sprj-     ierr = ISGetLocalSize(bA->isglobal.col[i],contents->dn + i+1);CHKERRQ(ierr);
22552c5f739Sprj-     contents->dn[i+1] += contents->dn[i];
22652c5f739Sprj-   }
22752c5f739Sprj-   ierr = PetscMalloc1(maxm*N,&contents->tarray);CHKERRQ(ierr);
22852c5f739Sprj-   ierr = MatDenseGetLDA(B,&ldb);CHKERRQ(ierr);
22952c5f739Sprj-   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
23052c5f739Sprj-   ierr = MatDenseGetArrayRead(B,&barray);CHKERRQ(ierr);
23152c5f739Sprj-   /* loops are permuted compared to MatMatMultNumeric so that viewB is created only once per column of A */
23252c5f739Sprj-   for (j=0; j<nc; j++) {
23352c5f739Sprj-     ierr = ISGetSize(bA->isglobal.col[j],&M);CHKERRQ(ierr);
23452c5f739Sprj-     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB);CHKERRQ(ierr);
2356718818eSStefano Zampini     ierr = MatDenseSetLDA(viewB,ldb);CHKERRQ(ierr);
23652c5f739Sprj-     for (i=0; i<nr; i++) {
23752c5f739Sprj-       if (!bA->m[i][j]) continue;
23852c5f739Sprj-       /* MatMatMultSymbolic may attach a specific container (depending on MatType of bA->m[i][j]) to workC[i][j] */
2394222ddf1SHong Zhang 
2404222ddf1SHong Zhang       ierr = MatProductCreate(bA->m[i][j],viewB,NULL,&contents->workC[i*nc + j]);CHKERRQ(ierr);
2414222ddf1SHong Zhang       workC = contents->workC[i*nc + j];
2424222ddf1SHong Zhang       ierr = MatProductSetType(workC,MATPRODUCT_AB);CHKERRQ(ierr);
2434222ddf1SHong Zhang       ierr = MatProductSetAlgorithm(workC,"default");CHKERRQ(ierr);
2444222ddf1SHong Zhang       ierr = MatProductSetFill(workC,fill);CHKERRQ(ierr);
2454222ddf1SHong Zhang       ierr = MatProductSetFromOptions(workC);CHKERRQ(ierr);
2464222ddf1SHong Zhang       ierr = MatProductSymbolic(workC);CHKERRQ(ierr);
2474222ddf1SHong Zhang 
2486718818eSStefano Zampini       /* since tarray will be shared by all Mat */
2496718818eSStefano Zampini       ierr = MatSeqDenseSetPreallocation(workC,contents->tarray);CHKERRQ(ierr);
2506718818eSStefano Zampini       ierr = MatMPIDenseSetPreallocation(workC,contents->tarray);CHKERRQ(ierr);
25152c5f739Sprj-     }
25252c5f739Sprj-     ierr = MatDestroy(&viewB);CHKERRQ(ierr);
25352c5f739Sprj-   }
25452c5f739Sprj-   ierr = MatDenseRestoreArrayRead(B,&barray);CHKERRQ(ierr);
25552c5f739Sprj- 
2566718818eSStefano Zampini   C->ops->productnumeric = MatProductNumeric_Nest_Dense;
25752c5f739Sprj-   PetscFunctionReturn(0);
25852c5f739Sprj- }
25952c5f739Sprj- 
2604222ddf1SHong Zhang /* --------------------------------------------------------- */
2614222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_Nest_Dense_AB(Mat C)
2624222ddf1SHong Zhang {
2634222ddf1SHong Zhang   PetscFunctionBegin;
2646718818eSStefano Zampini   C->ops->productsymbolic = MatProductSymbolic_Nest_Dense;
2654222ddf1SHong Zhang   PetscFunctionReturn(0);
2664222ddf1SHong Zhang }
2674222ddf1SHong Zhang 
2684222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_Nest_Dense(Mat C)
26952c5f739Sprj- {
27052c5f739Sprj-   PetscErrorCode ierr;
2714222ddf1SHong Zhang   Mat_Product    *product = C->product;
27252c5f739Sprj- 
27352c5f739Sprj-   PetscFunctionBegin;
2744222ddf1SHong Zhang   if (product->type == MATPRODUCT_AB) {
2754222ddf1SHong Zhang     ierr = MatProductSetFromOptions_Nest_Dense_AB(C);CHKERRQ(ierr);
2766718818eSStefano Zampini   }
27752c5f739Sprj-   PetscFunctionReturn(0);
27852c5f739Sprj- }
2794222ddf1SHong Zhang /* --------------------------------------------------------- */
28052c5f739Sprj- 
281207556f9SJed Brown static PetscErrorCode MatMultTranspose_Nest(Mat A,Vec x,Vec y)
282d8588912SDave May {
283d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
284207556f9SJed Brown   Vec            *bx = bA->left,*by = bA->right;
285207556f9SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
286d8588912SDave May   PetscErrorCode ierr;
287d8588912SDave May 
288d8588912SDave May   PetscFunctionBegin;
289609e31cbSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
290609e31cbSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(y,bA->isglobal.col[i],&by[i]);CHKERRQ(ierr);}
291207556f9SJed Brown   for (j=0; j<nc; j++) {
292609e31cbSJed Brown     ierr = VecZeroEntries(by[j]);CHKERRQ(ierr);
293609e31cbSJed Brown     for (i=0; i<nr; i++) {
2946c75ac25SJed Brown       if (!bA->m[i][j]) continue;
295609e31cbSJed Brown       /* y[j] <- y[j] + (A[i][j])^T * x[i] */
296609e31cbSJed Brown       ierr = MatMultTransposeAdd(bA->m[i][j],bx[i],by[j],by[j]);CHKERRQ(ierr);
297d8588912SDave May     }
298d8588912SDave May   }
299609e31cbSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
300609e31cbSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(y,bA->isglobal.col[i],&by[i]);CHKERRQ(ierr);}
301d8588912SDave May   PetscFunctionReturn(0);
302d8588912SDave May }
303d8588912SDave May 
3049194d70fSJed Brown static PetscErrorCode MatMultTransposeAdd_Nest(Mat A,Vec x,Vec y,Vec z)
3059194d70fSJed Brown {
3069194d70fSJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
3079194d70fSJed Brown   Vec            *bx = bA->left,*bz = bA->right;
3089194d70fSJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
3099194d70fSJed Brown   PetscErrorCode ierr;
3109194d70fSJed Brown 
3119194d70fSJed Brown   PetscFunctionBegin;
3129194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
3139194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(z,bA->isglobal.col[i],&bz[i]);CHKERRQ(ierr);}
3149194d70fSJed Brown   for (j=0; j<nc; j++) {
3159194d70fSJed Brown     if (y != z) {
3169194d70fSJed Brown       Vec by;
3179194d70fSJed Brown       ierr = VecGetSubVector(y,bA->isglobal.col[j],&by);CHKERRQ(ierr);
3189194d70fSJed Brown       ierr = VecCopy(by,bz[j]);CHKERRQ(ierr);
3199194d70fSJed Brown       ierr = VecRestoreSubVector(y,bA->isglobal.col[j],&by);CHKERRQ(ierr);
3209194d70fSJed Brown     }
3219194d70fSJed Brown     for (i=0; i<nr; i++) {
3226c75ac25SJed Brown       if (!bA->m[i][j]) continue;
3239194d70fSJed Brown       /* z[j] <- y[j] + (A[i][j])^T * x[i] */
3249194d70fSJed Brown       ierr = MatMultTransposeAdd(bA->m[i][j],bx[i],bz[j],bz[j]);CHKERRQ(ierr);
3259194d70fSJed Brown     }
3269194d70fSJed Brown   }
3279194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
3289194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(z,bA->isglobal.col[i],&bz[i]);CHKERRQ(ierr);}
3299194d70fSJed Brown   PetscFunctionReturn(0);
3309194d70fSJed Brown }
3319194d70fSJed Brown 
332f8170845SAlex Fikl static PetscErrorCode MatTranspose_Nest(Mat A,MatReuse reuse,Mat *B)
333f8170845SAlex Fikl {
334f8170845SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data, *bC;
335f8170845SAlex Fikl   Mat            C;
336f8170845SAlex Fikl   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
337f8170845SAlex Fikl   PetscErrorCode ierr;
338f8170845SAlex Fikl 
339f8170845SAlex Fikl   PetscFunctionBegin;
340cf37664fSBarry Smith   if (reuse == MAT_INPLACE_MATRIX && nr != nc) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_SIZ,"Square nested matrix only for in-place");
341f8170845SAlex Fikl 
342cf37664fSBarry Smith   if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_INPLACE_MATRIX) {
343f8170845SAlex Fikl     Mat *subs;
344f8170845SAlex Fikl     IS  *is_row,*is_col;
345f8170845SAlex Fikl 
346f8170845SAlex Fikl     ierr = PetscCalloc1(nr * nc,&subs);CHKERRQ(ierr);
347f8170845SAlex Fikl     ierr = PetscMalloc2(nr,&is_row,nc,&is_col);CHKERRQ(ierr);
348f8170845SAlex Fikl     ierr = MatNestGetISs(A,is_row,is_col);CHKERRQ(ierr);
349cf37664fSBarry Smith     if (reuse == MAT_INPLACE_MATRIX) {
350ddeb9bd8SAlex Fikl       for (i=0; i<nr; i++) {
351ddeb9bd8SAlex Fikl         for (j=0; j<nc; j++) {
352ddeb9bd8SAlex Fikl           subs[i + nr * j] = bA->m[i][j];
353ddeb9bd8SAlex Fikl         }
354ddeb9bd8SAlex Fikl       }
355ddeb9bd8SAlex Fikl     }
356ddeb9bd8SAlex Fikl 
357f8170845SAlex Fikl     ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nc,is_col,nr,is_row,subs,&C);CHKERRQ(ierr);
358f8170845SAlex Fikl     ierr = PetscFree(subs);CHKERRQ(ierr);
3593d994f23SBarry Smith     ierr = PetscFree2(is_row,is_col);CHKERRQ(ierr);
360f8170845SAlex Fikl   } else {
361f8170845SAlex Fikl     C = *B;
362f8170845SAlex Fikl   }
363f8170845SAlex Fikl 
364f8170845SAlex Fikl   bC = (Mat_Nest*)C->data;
365f8170845SAlex Fikl   for (i=0; i<nr; i++) {
366f8170845SAlex Fikl     for (j=0; j<nc; j++) {
367f8170845SAlex Fikl       if (bA->m[i][j]) {
368f8170845SAlex Fikl         ierr = MatTranspose(bA->m[i][j], reuse, &(bC->m[j][i]));CHKERRQ(ierr);
369f8170845SAlex Fikl       } else {
370f8170845SAlex Fikl         bC->m[j][i] = NULL;
371f8170845SAlex Fikl       }
372f8170845SAlex Fikl     }
373f8170845SAlex Fikl   }
374f8170845SAlex Fikl 
375cf37664fSBarry Smith   if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) {
376f8170845SAlex Fikl     *B = C;
377f8170845SAlex Fikl   } else {
378f8170845SAlex Fikl     ierr = MatHeaderMerge(A, &C);CHKERRQ(ierr);
379f8170845SAlex Fikl   }
380f8170845SAlex Fikl   PetscFunctionReturn(0);
381f8170845SAlex Fikl }
382f8170845SAlex Fikl 
383e2d7f03fSJed Brown static PetscErrorCode MatNestDestroyISList(PetscInt n,IS **list)
384e2d7f03fSJed Brown {
385e2d7f03fSJed Brown   PetscErrorCode ierr;
386e2d7f03fSJed Brown   IS             *lst = *list;
387e2d7f03fSJed Brown   PetscInt       i;
388e2d7f03fSJed Brown 
389e2d7f03fSJed Brown   PetscFunctionBegin;
390e2d7f03fSJed Brown   if (!lst) PetscFunctionReturn(0);
3916bf464f9SBarry Smith   for (i=0; i<n; i++) if (lst[i]) {ierr = ISDestroy(&lst[i]);CHKERRQ(ierr);}
392e2d7f03fSJed Brown   ierr  = PetscFree(lst);CHKERRQ(ierr);
3930298fd71SBarry Smith   *list = NULL;
394e2d7f03fSJed Brown   PetscFunctionReturn(0);
395e2d7f03fSJed Brown }
396e2d7f03fSJed Brown 
39706a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat A)
398d8588912SDave May {
399d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
400d8588912SDave May   PetscInt       i,j;
401d8588912SDave May   PetscErrorCode ierr;
402d8588912SDave May 
403d8588912SDave May   PetscFunctionBegin;
404d8588912SDave May   /* release the matrices and the place holders */
405e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nr,&vs->isglobal.row);CHKERRQ(ierr);
406e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nc,&vs->isglobal.col);CHKERRQ(ierr);
407e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nr,&vs->islocal.row);CHKERRQ(ierr);
408e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nc,&vs->islocal.col);CHKERRQ(ierr);
409d8588912SDave May 
410d8588912SDave May   ierr = PetscFree(vs->row_len);CHKERRQ(ierr);
411d8588912SDave May   ierr = PetscFree(vs->col_len);CHKERRQ(ierr);
41206a1af2fSStefano Zampini   ierr = PetscFree(vs->nnzstate);CHKERRQ(ierr);
413d8588912SDave May 
414207556f9SJed Brown   ierr = PetscFree2(vs->left,vs->right);CHKERRQ(ierr);
415207556f9SJed Brown 
416d8588912SDave May   /* release the matrices and the place holders */
417d8588912SDave May   if (vs->m) {
418d8588912SDave May     for (i=0; i<vs->nr; i++) {
419d8588912SDave May       for (j=0; j<vs->nc; j++) {
4206bf464f9SBarry Smith         ierr = MatDestroy(&vs->m[i][j]);CHKERRQ(ierr);
421d8588912SDave May       }
422d8588912SDave May       ierr = PetscFree(vs->m[i]);CHKERRQ(ierr);
423d8588912SDave May     }
424d8588912SDave May     ierr = PetscFree(vs->m);CHKERRQ(ierr);
425d8588912SDave May   }
42606a1af2fSStefano Zampini 
42706a1af2fSStefano Zampini   /* restore defaults */
42806a1af2fSStefano Zampini   vs->nr = 0;
42906a1af2fSStefano Zampini   vs->nc = 0;
43006a1af2fSStefano Zampini   vs->splitassembly = PETSC_FALSE;
43106a1af2fSStefano Zampini   PetscFunctionReturn(0);
43206a1af2fSStefano Zampini }
43306a1af2fSStefano Zampini 
43406a1af2fSStefano Zampini static PetscErrorCode MatDestroy_Nest(Mat A)
43506a1af2fSStefano Zampini {
43606a1af2fSStefano Zampini   PetscErrorCode ierr;
43706a1af2fSStefano Zampini 
43806a1af2fSStefano Zampini   ierr = MatReset_Nest(A);CHKERRQ(ierr);
439bf0cc555SLisandro Dalcin   ierr = PetscFree(A->data);CHKERRQ(ierr);
440d8588912SDave May 
441be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",NULL);CHKERRQ(ierr);
442be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",NULL);CHKERRQ(ierr);
443be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",NULL);CHKERRQ(ierr);
444be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",NULL);CHKERRQ(ierr);
445be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",NULL);CHKERRQ(ierr);
446be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",NULL);CHKERRQ(ierr);
447be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",NULL);CHKERRQ(ierr);
448be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",NULL);CHKERRQ(ierr);
449be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",NULL);CHKERRQ(ierr);
450be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",NULL);CHKERRQ(ierr);
451be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",NULL);CHKERRQ(ierr);
452be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",NULL);CHKERRQ(ierr);
453be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpidense_C",NULL);CHKERRQ(ierr);
454be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqdense_C",NULL);CHKERRQ(ierr);
4554222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_seqdense_C",NULL);CHKERRQ(ierr);
4564222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_mpidense_C",NULL);CHKERRQ(ierr);
4574222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_dense_C",NULL);CHKERRQ(ierr);
458d8588912SDave May   PetscFunctionReturn(0);
459d8588912SDave May }
460d8588912SDave May 
461381b8e50SStefano Zampini static PetscErrorCode MatMissingDiagonal_Nest(Mat mat,PetscBool *missing,PetscInt *dd)
462381b8e50SStefano Zampini {
463381b8e50SStefano Zampini   Mat_Nest       *vs = (Mat_Nest*)mat->data;
464381b8e50SStefano Zampini   PetscInt       i;
465381b8e50SStefano Zampini   PetscErrorCode ierr;
466381b8e50SStefano Zampini 
467381b8e50SStefano Zampini   PetscFunctionBegin;
468381b8e50SStefano Zampini   if (dd) *dd = 0;
469381b8e50SStefano Zampini   if (!vs->nr) {
470381b8e50SStefano Zampini     *missing = PETSC_TRUE;
471381b8e50SStefano Zampini     PetscFunctionReturn(0);
472381b8e50SStefano Zampini   }
473381b8e50SStefano Zampini   *missing = PETSC_FALSE;
474381b8e50SStefano Zampini   for (i = 0; i < vs->nr && !(*missing); i++) {
475381b8e50SStefano Zampini     *missing = PETSC_TRUE;
476381b8e50SStefano Zampini     if (vs->m[i][i]) {
477381b8e50SStefano Zampini       ierr = MatMissingDiagonal(vs->m[i][i],missing,NULL);CHKERRQ(ierr);
478381b8e50SStefano Zampini       if (*missing && dd) SETERRQ(PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"First missing entry not yet implemented");
479381b8e50SStefano Zampini     }
480381b8e50SStefano Zampini   }
481381b8e50SStefano Zampini   PetscFunctionReturn(0);
482381b8e50SStefano Zampini }
483381b8e50SStefano Zampini 
484207556f9SJed Brown static PetscErrorCode MatAssemblyBegin_Nest(Mat A,MatAssemblyType type)
485d8588912SDave May {
486d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
487d8588912SDave May   PetscInt       i,j;
488d8588912SDave May   PetscErrorCode ierr;
48906a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
490d8588912SDave May 
491d8588912SDave May   PetscFunctionBegin;
492d8588912SDave May   for (i=0; i<vs->nr; i++) {
493d8588912SDave May     for (j=0; j<vs->nc; j++) {
49406a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
495e7c19651SJed Brown       if (vs->m[i][j]) {
496e7c19651SJed Brown         ierr = MatAssemblyBegin(vs->m[i][j],type);CHKERRQ(ierr);
497e7c19651SJed Brown         if (!vs->splitassembly) {
498e7c19651SJed Brown           /* Note: split assembly will fail if the same block appears more than once (even indirectly through a nested
499e7c19651SJed Brown            * sub-block). This could be fixed by adding a flag to Mat so that there was a way to check if a Mat was
500e7c19651SJed Brown            * already performing an assembly, but the result would by more complicated and appears to offer less
501e7c19651SJed Brown            * potential for diagnostics and correctness checking. Split assembly should be fixed once there is an
502e7c19651SJed Brown            * interface for libraries to make asynchronous progress in "user-defined non-blocking collectives".
503e7c19651SJed Brown            */
504e7c19651SJed Brown           ierr = MatAssemblyEnd(vs->m[i][j],type);CHKERRQ(ierr);
50506a1af2fSStefano Zampini           ierr = MatGetNonzeroState(vs->m[i][j],&subnnzstate);CHKERRQ(ierr);
506e7c19651SJed Brown         }
507e7c19651SJed Brown       }
50806a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || vs->nnzstate[i*vs->nc+j] != subnnzstate);
50906a1af2fSStefano Zampini       vs->nnzstate[i*vs->nc+j] = subnnzstate;
510d8588912SDave May     }
511d8588912SDave May   }
51206a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
513d8588912SDave May   PetscFunctionReturn(0);
514d8588912SDave May }
515d8588912SDave May 
516207556f9SJed Brown static PetscErrorCode MatAssemblyEnd_Nest(Mat A, MatAssemblyType type)
517d8588912SDave May {
518d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
519d8588912SDave May   PetscInt       i,j;
520d8588912SDave May   PetscErrorCode ierr;
521d8588912SDave May 
522d8588912SDave May   PetscFunctionBegin;
523d8588912SDave May   for (i=0; i<vs->nr; i++) {
524d8588912SDave May     for (j=0; j<vs->nc; j++) {
525e7c19651SJed Brown       if (vs->m[i][j]) {
526e7c19651SJed Brown         if (vs->splitassembly) {
527e7c19651SJed Brown           ierr = MatAssemblyEnd(vs->m[i][j],type);CHKERRQ(ierr);
528e7c19651SJed Brown         }
529e7c19651SJed Brown       }
530d8588912SDave May     }
531d8588912SDave May   }
532d8588912SDave May   PetscFunctionReturn(0);
533d8588912SDave May }
534d8588912SDave May 
535f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatRow(Mat A,PetscInt row,Mat *B)
536d8588912SDave May {
537207556f9SJed Brown   PetscErrorCode ierr;
538f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
539f349c1fdSJed Brown   PetscInt       j;
540f349c1fdSJed Brown   Mat            sub;
541d8588912SDave May 
542d8588912SDave May   PetscFunctionBegin;
5430298fd71SBarry Smith   sub = (row < vs->nc) ? vs->m[row][row] : (Mat)NULL; /* Prefer to find on the diagonal */
544f349c1fdSJed Brown   for (j=0; !sub && j<vs->nc; j++) sub = vs->m[row][j];
5454994cf47SJed Brown   if (sub) {ierr = MatSetUp(sub);CHKERRQ(ierr);}       /* Ensure that the sizes are available */
546f349c1fdSJed Brown   *B = sub;
547f349c1fdSJed Brown   PetscFunctionReturn(0);
548d8588912SDave May }
549d8588912SDave May 
550f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatCol(Mat A,PetscInt col,Mat *B)
551f349c1fdSJed Brown {
552207556f9SJed Brown   PetscErrorCode ierr;
553f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
554f349c1fdSJed Brown   PetscInt       i;
555f349c1fdSJed Brown   Mat            sub;
556f349c1fdSJed Brown 
557f349c1fdSJed Brown   PetscFunctionBegin;
5580298fd71SBarry Smith   sub = (col < vs->nr) ? vs->m[col][col] : (Mat)NULL; /* Prefer to find on the diagonal */
559f349c1fdSJed Brown   for (i=0; !sub && i<vs->nr; i++) sub = vs->m[i][col];
5604994cf47SJed Brown   if (sub) {ierr = MatSetUp(sub);CHKERRQ(ierr);}       /* Ensure that the sizes are available */
561f349c1fdSJed Brown   *B = sub;
562f349c1fdSJed Brown   PetscFunctionReturn(0);
563d8588912SDave May }
564d8588912SDave May 
56518d228c0SPierre Jolivet static PetscErrorCode MatNestFindISRange(Mat A,PetscInt n,const IS list[],IS is,PetscInt *begin,PetscInt *end)
566f349c1fdSJed Brown {
56718d228c0SPierre Jolivet   PetscInt       i,j,size,m;
568f349c1fdSJed Brown   PetscBool      flg;
56918d228c0SPierre Jolivet   IS             out,concatenate[2];
57018d228c0SPierre Jolivet   PetscErrorCode ierr;
571f349c1fdSJed Brown 
572f349c1fdSJed Brown   PetscFunctionBegin;
573f349c1fdSJed Brown   PetscValidPointer(list,3);
574f349c1fdSJed Brown   PetscValidHeaderSpecific(is,IS_CLASSID,4);
57518d228c0SPierre Jolivet   if (begin) {
57618d228c0SPierre Jolivet     PetscValidIntPointer(begin,5);
57718d228c0SPierre Jolivet     *begin = -1;
57818d228c0SPierre Jolivet   }
57918d228c0SPierre Jolivet   if (end) {
58018d228c0SPierre Jolivet     PetscValidIntPointer(end,6);
58118d228c0SPierre Jolivet     *end = -1;
58218d228c0SPierre Jolivet   }
583f349c1fdSJed Brown   for (i=0; i<n; i++) {
584207556f9SJed Brown     if (!list[i]) continue;
585320466b0SStefano Zampini     ierr = ISEqualUnsorted(list[i],is,&flg);CHKERRQ(ierr);
586f349c1fdSJed Brown     if (flg) {
58718d228c0SPierre Jolivet       if (begin) *begin = i;
58818d228c0SPierre Jolivet       if (end) *end = i+1;
589f349c1fdSJed Brown       PetscFunctionReturn(0);
590f349c1fdSJed Brown     }
591f349c1fdSJed Brown   }
59218d228c0SPierre Jolivet   ierr = ISGetSize(is,&size);CHKERRQ(ierr);
59318d228c0SPierre Jolivet   for (i=0; i<n-1; i++) {
59418d228c0SPierre Jolivet     if (!list[i]) continue;
59518d228c0SPierre Jolivet     m = 0;
59618d228c0SPierre Jolivet     ierr = ISConcatenate(PetscObjectComm((PetscObject)A),2,list+i,&out);CHKERRQ(ierr);
59718d228c0SPierre Jolivet     ierr = ISGetSize(out,&m);CHKERRQ(ierr);
59818d228c0SPierre Jolivet     for (j=i+2; j<n && m<size; j++) {
59918d228c0SPierre Jolivet       if (list[j]) {
60018d228c0SPierre Jolivet         concatenate[0] = out;
60118d228c0SPierre Jolivet         concatenate[1] = list[j];
60218d228c0SPierre Jolivet         ierr = ISConcatenate(PetscObjectComm((PetscObject)A),2,concatenate,&out);CHKERRQ(ierr);
60318d228c0SPierre Jolivet         ierr = ISDestroy(concatenate);CHKERRQ(ierr);
60418d228c0SPierre Jolivet         ierr = ISGetSize(out,&m);CHKERRQ(ierr);
60518d228c0SPierre Jolivet       }
60618d228c0SPierre Jolivet     }
60718d228c0SPierre Jolivet     if (m == size) {
60818d228c0SPierre Jolivet       ierr = ISEqualUnsorted(out,is,&flg);CHKERRQ(ierr);
60918d228c0SPierre Jolivet       if (flg) {
61018d228c0SPierre Jolivet         if (begin) *begin = i;
61118d228c0SPierre Jolivet         if (end) *end = j;
61218d228c0SPierre Jolivet         ierr = ISDestroy(&out);CHKERRQ(ierr);
61318d228c0SPierre Jolivet         PetscFunctionReturn(0);
61418d228c0SPierre Jolivet       }
61518d228c0SPierre Jolivet     }
61618d228c0SPierre Jolivet     ierr = ISDestroy(&out);CHKERRQ(ierr);
61718d228c0SPierre Jolivet   }
61818d228c0SPierre Jolivet   PetscFunctionReturn(0);
619f349c1fdSJed Brown }
620f349c1fdSJed Brown 
62118d228c0SPierre Jolivet 
62218d228c0SPierre Jolivet static PetscErrorCode MatNestFillEmptyMat_Private(Mat A,PetscInt i,PetscInt j,Mat *B)
6238188e55aSJed Brown {
6248188e55aSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
62518d228c0SPierre Jolivet   PetscInt       lr,lc;
62618d228c0SPierre Jolivet   PetscErrorCode ierr;
62718d228c0SPierre Jolivet 
62818d228c0SPierre Jolivet   PetscFunctionBegin;
62918d228c0SPierre Jolivet   ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr);
63018d228c0SPierre Jolivet   ierr = ISGetLocalSize(vs->isglobal.row[i],&lr);CHKERRQ(ierr);
63118d228c0SPierre Jolivet   ierr = ISGetLocalSize(vs->isglobal.col[j],&lc);CHKERRQ(ierr);
63218d228c0SPierre Jolivet   ierr = MatSetSizes(*B,lr,lc,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr);
63318d228c0SPierre Jolivet   ierr = MatSetType(*B,MATAIJ);CHKERRQ(ierr);
63418d228c0SPierre Jolivet   ierr = MatSeqAIJSetPreallocation(*B,0,NULL);CHKERRQ(ierr);
63518d228c0SPierre Jolivet   ierr = MatMPIAIJSetPreallocation(*B,0,NULL,0,NULL);CHKERRQ(ierr);
63618d228c0SPierre Jolivet   ierr = MatSetUp(*B);CHKERRQ(ierr);
63718d228c0SPierre Jolivet   ierr = MatSetOption(*B,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
63818d228c0SPierre Jolivet   ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
63918d228c0SPierre Jolivet   ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
64018d228c0SPierre Jolivet   PetscFunctionReturn(0);
64118d228c0SPierre Jolivet }
64218d228c0SPierre Jolivet 
64318d228c0SPierre Jolivet static PetscErrorCode MatNestGetBlock_Private(Mat A,PetscInt rbegin,PetscInt rend,PetscInt cbegin,PetscInt cend,Mat *B)
64418d228c0SPierre Jolivet {
64518d228c0SPierre Jolivet   Mat_Nest       *vs = (Mat_Nest*)A->data;
64618d228c0SPierre Jolivet   Mat            *a;
64718d228c0SPierre Jolivet   PetscInt       i,j,k,l,nr=rend-rbegin,nc=cend-cbegin;
6488188e55aSJed Brown   char           keyname[256];
64918d228c0SPierre Jolivet   PetscBool      *b;
65018d228c0SPierre Jolivet   PetscBool      flg;
6518188e55aSJed Brown   PetscErrorCode ierr;
6528188e55aSJed Brown 
6538188e55aSJed Brown   PetscFunctionBegin;
6540298fd71SBarry Smith   *B   = NULL;
65518d228c0SPierre Jolivet   ierr = PetscSNPrintf(keyname,sizeof(keyname),"NestBlock_%D-%Dx%D-%D",rbegin,rend,cbegin,cend);CHKERRQ(ierr);
6568188e55aSJed Brown   ierr = PetscObjectQuery((PetscObject)A,keyname,(PetscObject*)B);CHKERRQ(ierr);
6578188e55aSJed Brown   if (*B) PetscFunctionReturn(0);
6588188e55aSJed Brown 
65918d228c0SPierre Jolivet   ierr = PetscMalloc2(nr*nc,&a,nr*nc,&b);CHKERRQ(ierr);
66018d228c0SPierre Jolivet   for (i=0; i<nr; i++) {
66118d228c0SPierre Jolivet     for (j=0; j<nc; j++) {
66218d228c0SPierre Jolivet       a[i*nc + j] = vs->m[rbegin+i][cbegin+j];
66318d228c0SPierre Jolivet       b[i*nc + j] = PETSC_FALSE;
66418d228c0SPierre Jolivet     }
66518d228c0SPierre Jolivet   }
66618d228c0SPierre Jolivet   if (nc!=vs->nc&&nr!=vs->nr) {
66718d228c0SPierre Jolivet     for (i=0; i<nr; i++) {
66818d228c0SPierre Jolivet       for (j=0; j<nc; j++) {
66918d228c0SPierre Jolivet         flg = PETSC_FALSE;
67018d228c0SPierre Jolivet         for (k=0; (k<nr&&!flg); k++) {
67118d228c0SPierre Jolivet           if (a[j + k*nc]) flg = PETSC_TRUE;
67218d228c0SPierre Jolivet         }
67318d228c0SPierre Jolivet         if (flg) {
67418d228c0SPierre Jolivet           flg = PETSC_FALSE;
67518d228c0SPierre Jolivet           for (l=0; (l<nc&&!flg); l++) {
67618d228c0SPierre Jolivet             if (a[i*nc + l]) flg = PETSC_TRUE;
67718d228c0SPierre Jolivet           }
67818d228c0SPierre Jolivet         }
67918d228c0SPierre Jolivet         if (!flg) {
68018d228c0SPierre Jolivet           b[i*nc + j] = PETSC_TRUE;
68118d228c0SPierre Jolivet           ierr = MatNestFillEmptyMat_Private(A,rbegin+i,cbegin+j,a + i*nc + j);CHKERRQ(ierr);
68218d228c0SPierre Jolivet         }
68318d228c0SPierre Jolivet       }
68418d228c0SPierre Jolivet     }
68518d228c0SPierre Jolivet   }
68618d228c0SPierre Jolivet   ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nr,nr!=vs->nr?NULL:vs->isglobal.row,nc,nc!=vs->nc?NULL:vs->isglobal.col,a,B);CHKERRQ(ierr);
68718d228c0SPierre Jolivet   for (i=0; i<nr; i++) {
68818d228c0SPierre Jolivet     for (j=0; j<nc; j++) {
68918d228c0SPierre Jolivet       if (b[i*nc + j]) {
69018d228c0SPierre Jolivet         ierr = MatDestroy(a + i*nc + j);CHKERRQ(ierr);
69118d228c0SPierre Jolivet       }
69218d228c0SPierre Jolivet     }
69318d228c0SPierre Jolivet   }
69418d228c0SPierre Jolivet   ierr = PetscFree2(a,b);CHKERRQ(ierr);
6958188e55aSJed Brown   (*B)->assembled = A->assembled;
6968188e55aSJed Brown   ierr = PetscObjectCompose((PetscObject)A,keyname,(PetscObject)*B);CHKERRQ(ierr);
6978188e55aSJed Brown   ierr = PetscObjectDereference((PetscObject)*B);CHKERRQ(ierr); /* Leave the only remaining reference in the composition */
6988188e55aSJed Brown   PetscFunctionReturn(0);
6998188e55aSJed Brown }
7008188e55aSJed Brown 
701f349c1fdSJed Brown static PetscErrorCode MatNestFindSubMat(Mat A,struct MatNestISPair *is,IS isrow,IS iscol,Mat *B)
702f349c1fdSJed Brown {
703f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
70418d228c0SPierre Jolivet   PetscInt       rbegin,rend,cbegin,cend;
7058188e55aSJed Brown   PetscErrorCode ierr;
706f349c1fdSJed Brown 
707f349c1fdSJed Brown   PetscFunctionBegin;
70818d228c0SPierre Jolivet   ierr = MatNestFindISRange(A,vs->nr,is->row,isrow,&rbegin,&rend);CHKERRQ(ierr);
70918d228c0SPierre Jolivet   ierr = MatNestFindISRange(A,vs->nc,is->col,iscol,&cbegin,&cend);CHKERRQ(ierr);
71018d228c0SPierre Jolivet   if (rend == rbegin + 1 && cend == cbegin + 1) {
71118d228c0SPierre Jolivet     if (!vs->m[rbegin][cbegin]) {
71218d228c0SPierre Jolivet       ierr = MatNestFillEmptyMat_Private(A,rbegin,cbegin,vs->m[rbegin] + cbegin);CHKERRQ(ierr);
71377019fcaSJed Brown     }
71418d228c0SPierre Jolivet     *B = vs->m[rbegin][cbegin];
71518d228c0SPierre Jolivet   } else if (rbegin != -1 && cbegin != -1) {
71618d228c0SPierre Jolivet     ierr = MatNestGetBlock_Private(A,rbegin,rend,cbegin,cend,B);CHKERRQ(ierr);
71718d228c0SPierre Jolivet   } else SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Could not find index set");
718f349c1fdSJed Brown   PetscFunctionReturn(0);
719f349c1fdSJed Brown }
720f349c1fdSJed Brown 
72106a1af2fSStefano Zampini /*
72206a1af2fSStefano Zampini    TODO: This does not actually returns a submatrix we can modify
72306a1af2fSStefano Zampini */
7247dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrix_Nest(Mat A,IS isrow,IS iscol,MatReuse reuse,Mat *B)
725f349c1fdSJed Brown {
726f349c1fdSJed Brown   PetscErrorCode ierr;
727f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
728f349c1fdSJed Brown   Mat            sub;
729f349c1fdSJed Brown 
730f349c1fdSJed Brown   PetscFunctionBegin;
731f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->isglobal,isrow,iscol,&sub);CHKERRQ(ierr);
732f349c1fdSJed Brown   switch (reuse) {
733f349c1fdSJed Brown   case MAT_INITIAL_MATRIX:
7347874fa86SDave May     if (sub) { ierr = PetscObjectReference((PetscObject)sub);CHKERRQ(ierr); }
735f349c1fdSJed Brown     *B = sub;
736f349c1fdSJed Brown     break;
737f349c1fdSJed Brown   case MAT_REUSE_MATRIX:
738ce94432eSBarry Smith     if (sub != *B) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Submatrix was not used before in this call");
739f349c1fdSJed Brown     break;
740f349c1fdSJed Brown   case MAT_IGNORE_MATRIX:       /* Nothing to do */
741f349c1fdSJed Brown     break;
742511c6705SHong Zhang   case MAT_INPLACE_MATRIX:       /* Nothing to do */
743511c6705SHong Zhang     SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MAT_INPLACE_MATRIX is not supported yet");
744f349c1fdSJed Brown   }
745f349c1fdSJed Brown   PetscFunctionReturn(0);
746f349c1fdSJed Brown }
747f349c1fdSJed Brown 
748f349c1fdSJed Brown PetscErrorCode MatGetLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B)
749f349c1fdSJed Brown {
750f349c1fdSJed Brown   PetscErrorCode ierr;
751f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
752f349c1fdSJed Brown   Mat            sub;
753f349c1fdSJed Brown 
754f349c1fdSJed Brown   PetscFunctionBegin;
755f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub);CHKERRQ(ierr);
756f349c1fdSJed Brown   /* We allow the submatrix to be NULL, perhaps it would be better for the user to return an empty matrix instead */
757f349c1fdSJed Brown   if (sub) {ierr = PetscObjectReference((PetscObject)sub);CHKERRQ(ierr);}
758f349c1fdSJed Brown   *B = sub;
759d8588912SDave May   PetscFunctionReturn(0);
760d8588912SDave May }
761d8588912SDave May 
762207556f9SJed Brown static PetscErrorCode MatRestoreLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B)
763d8588912SDave May {
764d8588912SDave May   PetscErrorCode ierr;
765f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
766f349c1fdSJed Brown   Mat            sub;
767d8588912SDave May 
768d8588912SDave May   PetscFunctionBegin;
769f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub);CHKERRQ(ierr);
770ce94432eSBarry Smith   if (*B != sub) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has not been gotten");
771f349c1fdSJed Brown   if (sub) {
772ce94432eSBarry Smith     if (((PetscObject)sub)->refct <= 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has had reference count decremented too many times");
7736bf464f9SBarry Smith     ierr = MatDestroy(B);CHKERRQ(ierr);
774d8588912SDave May   }
775d8588912SDave May   PetscFunctionReturn(0);
776d8588912SDave May }
777d8588912SDave May 
7787874fa86SDave May static PetscErrorCode MatGetDiagonal_Nest(Mat A,Vec v)
7797874fa86SDave May {
7807874fa86SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
7817874fa86SDave May   PetscInt       i;
7827874fa86SDave May   PetscErrorCode ierr;
7837874fa86SDave May 
7847874fa86SDave May   PetscFunctionBegin;
7857874fa86SDave May   for (i=0; i<bA->nr; i++) {
786429bac76SJed Brown     Vec bv;
787429bac76SJed Brown     ierr = VecGetSubVector(v,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
7887874fa86SDave May     if (bA->m[i][i]) {
789429bac76SJed Brown       ierr = MatGetDiagonal(bA->m[i][i],bv);CHKERRQ(ierr);
7907874fa86SDave May     } else {
7915159a857SMatthew G. Knepley       ierr = VecSet(bv,0.0);CHKERRQ(ierr);
7927874fa86SDave May     }
793429bac76SJed Brown     ierr = VecRestoreSubVector(v,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
7947874fa86SDave May   }
7957874fa86SDave May   PetscFunctionReturn(0);
7967874fa86SDave May }
7977874fa86SDave May 
7987874fa86SDave May static PetscErrorCode MatDiagonalScale_Nest(Mat A,Vec l,Vec r)
7997874fa86SDave May {
8007874fa86SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
801429bac76SJed Brown   Vec            bl,*br;
8027874fa86SDave May   PetscInt       i,j;
8037874fa86SDave May   PetscErrorCode ierr;
8047874fa86SDave May 
8057874fa86SDave May   PetscFunctionBegin;
8063f800ebeSJed Brown   ierr = PetscCalloc1(bA->nc,&br);CHKERRQ(ierr);
8072e6472ebSElliott Sales de Andrade   if (r) {
808429bac76SJed Brown     for (j=0; j<bA->nc; j++) {ierr = VecGetSubVector(r,bA->isglobal.col[j],&br[j]);CHKERRQ(ierr);}
8092e6472ebSElliott Sales de Andrade   }
8102e6472ebSElliott Sales de Andrade   bl = NULL;
8117874fa86SDave May   for (i=0; i<bA->nr; i++) {
8122e6472ebSElliott Sales de Andrade     if (l) {
813429bac76SJed Brown       ierr = VecGetSubVector(l,bA->isglobal.row[i],&bl);CHKERRQ(ierr);
8142e6472ebSElliott Sales de Andrade     }
8157874fa86SDave May     for (j=0; j<bA->nc; j++) {
8167874fa86SDave May       if (bA->m[i][j]) {
817429bac76SJed Brown         ierr = MatDiagonalScale(bA->m[i][j],bl,br[j]);CHKERRQ(ierr);
8187874fa86SDave May       }
8197874fa86SDave May     }
8202e6472ebSElliott Sales de Andrade     if (l) {
821a061e289SJed Brown       ierr = VecRestoreSubVector(l,bA->isglobal.row[i],&bl);CHKERRQ(ierr);
8227874fa86SDave May     }
8232e6472ebSElliott Sales de Andrade   }
8242e6472ebSElliott Sales de Andrade   if (r) {
825429bac76SJed Brown     for (j=0; j<bA->nc; j++) {ierr = VecRestoreSubVector(r,bA->isglobal.col[j],&br[j]);CHKERRQ(ierr);}
8262e6472ebSElliott Sales de Andrade   }
827429bac76SJed Brown   ierr = PetscFree(br);CHKERRQ(ierr);
8287874fa86SDave May   PetscFunctionReturn(0);
8297874fa86SDave May }
8307874fa86SDave May 
831a061e289SJed Brown static PetscErrorCode MatScale_Nest(Mat A,PetscScalar a)
832a061e289SJed Brown {
833a061e289SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
834a061e289SJed Brown   PetscInt       i,j;
835a061e289SJed Brown   PetscErrorCode ierr;
836a061e289SJed Brown 
837a061e289SJed Brown   PetscFunctionBegin;
838a061e289SJed Brown   for (i=0; i<bA->nr; i++) {
839a061e289SJed Brown     for (j=0; j<bA->nc; j++) {
840a061e289SJed Brown       if (bA->m[i][j]) {
841a061e289SJed Brown         ierr = MatScale(bA->m[i][j],a);CHKERRQ(ierr);
842a061e289SJed Brown       }
843a061e289SJed Brown     }
844a061e289SJed Brown   }
845a061e289SJed Brown   PetscFunctionReturn(0);
846a061e289SJed Brown }
847a061e289SJed Brown 
848a061e289SJed Brown static PetscErrorCode MatShift_Nest(Mat A,PetscScalar a)
849a061e289SJed Brown {
850a061e289SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
851a061e289SJed Brown   PetscInt       i;
852a061e289SJed Brown   PetscErrorCode ierr;
85306a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
854a061e289SJed Brown 
855a061e289SJed Brown   PetscFunctionBegin;
856a061e289SJed Brown   for (i=0; i<bA->nr; i++) {
85706a1af2fSStefano Zampini     PetscObjectState subnnzstate = 0;
858ce94432eSBarry Smith     if (!bA->m[i][i]) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"No support for shifting an empty diagonal block, insert a matrix in block (%D,%D)",i,i);
859a061e289SJed Brown     ierr = MatShift(bA->m[i][i],a);CHKERRQ(ierr);
86006a1af2fSStefano Zampini     ierr = MatGetNonzeroState(bA->m[i][i],&subnnzstate);CHKERRQ(ierr);
86106a1af2fSStefano Zampini     nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i*bA->nc+i] != subnnzstate);
86206a1af2fSStefano Zampini     bA->nnzstate[i*bA->nc+i] = subnnzstate;
863a061e289SJed Brown   }
86406a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
865a061e289SJed Brown   PetscFunctionReturn(0);
866a061e289SJed Brown }
867a061e289SJed Brown 
86813135bc6SAlex Fikl static PetscErrorCode MatDiagonalSet_Nest(Mat A,Vec D,InsertMode is)
86913135bc6SAlex Fikl {
87013135bc6SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data;
87113135bc6SAlex Fikl   PetscInt       i;
87213135bc6SAlex Fikl   PetscErrorCode ierr;
87306a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
87413135bc6SAlex Fikl 
87513135bc6SAlex Fikl   PetscFunctionBegin;
87613135bc6SAlex Fikl   for (i=0; i<bA->nr; i++) {
87706a1af2fSStefano Zampini     PetscObjectState subnnzstate = 0;
87813135bc6SAlex Fikl     Vec              bv;
87913135bc6SAlex Fikl     ierr = VecGetSubVector(D,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
88013135bc6SAlex Fikl     if (bA->m[i][i]) {
88113135bc6SAlex Fikl       ierr = MatDiagonalSet(bA->m[i][i],bv,is);CHKERRQ(ierr);
88206a1af2fSStefano Zampini       ierr = MatGetNonzeroState(bA->m[i][i],&subnnzstate);CHKERRQ(ierr);
88313135bc6SAlex Fikl     }
88413135bc6SAlex Fikl     ierr = VecRestoreSubVector(D,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
88506a1af2fSStefano Zampini     nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i*bA->nc+i] != subnnzstate);
88606a1af2fSStefano Zampini     bA->nnzstate[i*bA->nc+i] = subnnzstate;
88713135bc6SAlex Fikl   }
88806a1af2fSStefano Zampini   if (nnzstate) A->nonzerostate++;
88913135bc6SAlex Fikl   PetscFunctionReturn(0);
89013135bc6SAlex Fikl }
89113135bc6SAlex Fikl 
892f8170845SAlex Fikl static PetscErrorCode MatSetRandom_Nest(Mat A,PetscRandom rctx)
893f8170845SAlex Fikl {
894f8170845SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data;
895f8170845SAlex Fikl   PetscInt       i,j;
896f8170845SAlex Fikl   PetscErrorCode ierr;
897f8170845SAlex Fikl 
898f8170845SAlex Fikl   PetscFunctionBegin;
899f8170845SAlex Fikl   for (i=0; i<bA->nr; i++) {
900f8170845SAlex Fikl     for (j=0; j<bA->nc; j++) {
901f8170845SAlex Fikl       if (bA->m[i][j]) {
902f8170845SAlex Fikl         ierr = MatSetRandom(bA->m[i][j],rctx);CHKERRQ(ierr);
903f8170845SAlex Fikl       }
904f8170845SAlex Fikl     }
905f8170845SAlex Fikl   }
906f8170845SAlex Fikl   PetscFunctionReturn(0);
907f8170845SAlex Fikl }
908f8170845SAlex Fikl 
9092a7a6963SBarry Smith static PetscErrorCode MatCreateVecs_Nest(Mat A,Vec *right,Vec *left)
910d8588912SDave May {
911d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
912d8588912SDave May   Vec            *L,*R;
913d8588912SDave May   MPI_Comm       comm;
914d8588912SDave May   PetscInt       i,j;
915d8588912SDave May   PetscErrorCode ierr;
916d8588912SDave May 
917d8588912SDave May   PetscFunctionBegin;
918ce94432eSBarry Smith   ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr);
919d8588912SDave May   if (right) {
920d8588912SDave May     /* allocate R */
921854ce69bSBarry Smith     ierr = PetscMalloc1(bA->nc, &R);CHKERRQ(ierr);
922d8588912SDave May     /* Create the right vectors */
923d8588912SDave May     for (j=0; j<bA->nc; j++) {
924d8588912SDave May       for (i=0; i<bA->nr; i++) {
925d8588912SDave May         if (bA->m[i][j]) {
9262a7a6963SBarry Smith           ierr = MatCreateVecs(bA->m[i][j],&R[j],NULL);CHKERRQ(ierr);
927d8588912SDave May           break;
928d8588912SDave May         }
929d8588912SDave May       }
9306c4ed002SBarry Smith       if (i==bA->nr) SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null column.");
931d8588912SDave May     }
932f349c1fdSJed Brown     ierr = VecCreateNest(comm,bA->nc,bA->isglobal.col,R,right);CHKERRQ(ierr);
933d8588912SDave May     /* hand back control to the nest vector */
934d8588912SDave May     for (j=0; j<bA->nc; j++) {
9356bf464f9SBarry Smith       ierr = VecDestroy(&R[j]);CHKERRQ(ierr);
936d8588912SDave May     }
937d8588912SDave May     ierr = PetscFree(R);CHKERRQ(ierr);
938d8588912SDave May   }
939d8588912SDave May 
940d8588912SDave May   if (left) {
941d8588912SDave May     /* allocate L */
942854ce69bSBarry Smith     ierr = PetscMalloc1(bA->nr, &L);CHKERRQ(ierr);
943d8588912SDave May     /* Create the left vectors */
944d8588912SDave May     for (i=0; i<bA->nr; i++) {
945d8588912SDave May       for (j=0; j<bA->nc; j++) {
946d8588912SDave May         if (bA->m[i][j]) {
9472a7a6963SBarry Smith           ierr = MatCreateVecs(bA->m[i][j],NULL,&L[i]);CHKERRQ(ierr);
948d8588912SDave May           break;
949d8588912SDave May         }
950d8588912SDave May       }
9516c4ed002SBarry Smith       if (j==bA->nc) SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null row.");
952d8588912SDave May     }
953d8588912SDave May 
954f349c1fdSJed Brown     ierr = VecCreateNest(comm,bA->nr,bA->isglobal.row,L,left);CHKERRQ(ierr);
955d8588912SDave May     for (i=0; i<bA->nr; i++) {
9566bf464f9SBarry Smith       ierr = VecDestroy(&L[i]);CHKERRQ(ierr);
957d8588912SDave May     }
958d8588912SDave May 
959d8588912SDave May     ierr = PetscFree(L);CHKERRQ(ierr);
960d8588912SDave May   }
961d8588912SDave May   PetscFunctionReturn(0);
962d8588912SDave May }
963d8588912SDave May 
964207556f9SJed Brown static PetscErrorCode MatView_Nest(Mat A,PetscViewer viewer)
965d8588912SDave May {
966d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
96729e60adbSStefano Zampini   PetscBool      isascii,viewSub = PETSC_FALSE;
968d8588912SDave May   PetscInt       i,j;
969d8588912SDave May   PetscErrorCode ierr;
970d8588912SDave May 
971d8588912SDave May   PetscFunctionBegin;
972251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
973d8588912SDave May   if (isascii) {
974d8588912SDave May 
97529e60adbSStefano Zampini     ierr = PetscOptionsGetBool(((PetscObject)A)->options,((PetscObject)A)->prefix,"-mat_view_nest_sub",&viewSub,NULL);CHKERRQ(ierr);
976d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"Matrix object: \n");CHKERRQ(ierr);
977d86155a6SBarry Smith     ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);
978d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer, "type=nest, rows=%D, cols=%D \n",bA->nr,bA->nc);CHKERRQ(ierr);
979d8588912SDave May 
980d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"MatNest structure: \n");CHKERRQ(ierr);
981d8588912SDave May     for (i=0; i<bA->nr; i++) {
982d8588912SDave May       for (j=0; j<bA->nc; j++) {
98319fd82e9SBarry Smith         MatType   type;
984270f95d7SJed Brown         char      name[256] = "",prefix[256] = "";
985d8588912SDave May         PetscInt  NR,NC;
986d8588912SDave May         PetscBool isNest = PETSC_FALSE;
987d8588912SDave May 
988d8588912SDave May         if (!bA->m[i][j]) {
98985019af4SBarry Smith           ierr = PetscViewerASCIIPrintf(viewer, "(%D,%D) : NULL \n",i,j);CHKERRQ(ierr);
990d8588912SDave May           continue;
991d8588912SDave May         }
992d8588912SDave May         ierr = MatGetSize(bA->m[i][j],&NR,&NC);CHKERRQ(ierr);
993d8588912SDave May         ierr = MatGetType(bA->m[i][j], &type);CHKERRQ(ierr);
9948caf3d72SBarry Smith         if (((PetscObject)bA->m[i][j])->name) {ierr = PetscSNPrintf(name,sizeof(name),"name=\"%s\", ",((PetscObject)bA->m[i][j])->name);CHKERRQ(ierr);}
9958caf3d72SBarry Smith         if (((PetscObject)bA->m[i][j])->prefix) {ierr = PetscSNPrintf(prefix,sizeof(prefix),"prefix=\"%s\", ",((PetscObject)bA->m[i][j])->prefix);CHKERRQ(ierr);}
996251f4c67SDmitry Karpeev         ierr = PetscObjectTypeCompare((PetscObject)bA->m[i][j],MATNEST,&isNest);CHKERRQ(ierr);
997d8588912SDave May 
998270f95d7SJed Brown         ierr = PetscViewerASCIIPrintf(viewer,"(%D,%D) : %s%stype=%s, rows=%D, cols=%D \n",i,j,name,prefix,type,NR,NC);CHKERRQ(ierr);
999d8588912SDave May 
100029e60adbSStefano Zampini         if (isNest || viewSub) {
1001270f95d7SJed Brown           ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);  /* push1 */
1002d8588912SDave May           ierr = MatView(bA->m[i][j],viewer);CHKERRQ(ierr);
1003270f95d7SJed Brown           ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);    /* pop1 */
1004d8588912SDave May         }
1005d8588912SDave May       }
1006d8588912SDave May     }
1007d86155a6SBarry Smith     ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);    /* pop0 */
1008d8588912SDave May   }
1009d8588912SDave May   PetscFunctionReturn(0);
1010d8588912SDave May }
1011d8588912SDave May 
1012207556f9SJed Brown static PetscErrorCode MatZeroEntries_Nest(Mat A)
1013d8588912SDave May {
1014d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
1015d8588912SDave May   PetscInt       i,j;
1016d8588912SDave May   PetscErrorCode ierr;
1017d8588912SDave May 
1018d8588912SDave May   PetscFunctionBegin;
1019d8588912SDave May   for (i=0; i<bA->nr; i++) {
1020d8588912SDave May     for (j=0; j<bA->nc; j++) {
1021d8588912SDave May       if (!bA->m[i][j]) continue;
1022d8588912SDave May       ierr = MatZeroEntries(bA->m[i][j]);CHKERRQ(ierr);
1023d8588912SDave May     }
1024d8588912SDave May   }
1025d8588912SDave May   PetscFunctionReturn(0);
1026d8588912SDave May }
1027d8588912SDave May 
1028c222c20dSDavid Ham static PetscErrorCode MatCopy_Nest(Mat A,Mat B,MatStructure str)
1029c222c20dSDavid Ham {
1030c222c20dSDavid Ham   Mat_Nest       *bA = (Mat_Nest*)A->data,*bB = (Mat_Nest*)B->data;
1031c222c20dSDavid Ham   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
1032c222c20dSDavid Ham   PetscErrorCode ierr;
103306a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
1034c222c20dSDavid Ham 
1035c222c20dSDavid Ham   PetscFunctionBegin;
1036c222c20dSDavid Ham   if (nr != bB->nr || nc != bB->nc) SETERRQ4(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Cannot copy a Mat_Nest of block size (%D,%D) to a Mat_Nest of block size (%D,%D)",bB->nr,bB->nc,nr,nc);
1037c222c20dSDavid Ham   for (i=0; i<nr; i++) {
1038c222c20dSDavid Ham     for (j=0; j<nc; j++) {
103906a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
104046a2b97cSJed Brown       if (bA->m[i][j] && bB->m[i][j]) {
1041c222c20dSDavid Ham         ierr = MatCopy(bA->m[i][j],bB->m[i][j],str);CHKERRQ(ierr);
104246a2b97cSJed Brown       } else if (bA->m[i][j] || bB->m[i][j]) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %D,%D",i,j);
104306a1af2fSStefano Zampini       ierr = MatGetNonzeroState(bB->m[i][j],&subnnzstate);CHKERRQ(ierr);
104406a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || bB->nnzstate[i*nc+j] != subnnzstate);
104506a1af2fSStefano Zampini       bB->nnzstate[i*nc+j] = subnnzstate;
1046c222c20dSDavid Ham     }
1047c222c20dSDavid Ham   }
104806a1af2fSStefano Zampini   if (nnzstate) B->nonzerostate++;
1049c222c20dSDavid Ham   PetscFunctionReturn(0);
1050c222c20dSDavid Ham }
1051c222c20dSDavid Ham 
10526e76ffeaSPierre Jolivet static PetscErrorCode MatAXPY_Nest(Mat Y,PetscScalar a,Mat X,MatStructure str)
10536e76ffeaSPierre Jolivet {
10546e76ffeaSPierre Jolivet   Mat_Nest       *bY = (Mat_Nest*)Y->data,*bX = (Mat_Nest*)X->data;
10556e76ffeaSPierre Jolivet   PetscInt       i,j,nr = bY->nr,nc = bY->nc;
10566e76ffeaSPierre Jolivet   PetscErrorCode ierr;
105706a1af2fSStefano Zampini   PetscBool      nnzstate = PETSC_FALSE;
10586e76ffeaSPierre Jolivet 
10596e76ffeaSPierre Jolivet   PetscFunctionBegin;
10606e76ffeaSPierre Jolivet   if (nr != bX->nr || nc != bX->nc) SETERRQ4(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Cannot AXPY a MatNest of block size (%D,%D) with a MatNest of block size (%D,%D)",bX->nr,bX->nc,nr,nc);
10616e76ffeaSPierre Jolivet   for (i=0; i<nr; i++) {
10626e76ffeaSPierre Jolivet     for (j=0; j<nc; j++) {
106306a1af2fSStefano Zampini       PetscObjectState subnnzstate = 0;
10646e76ffeaSPierre Jolivet       if (bY->m[i][j] && bX->m[i][j]) {
10656e76ffeaSPierre Jolivet         ierr = MatAXPY(bY->m[i][j],a,bX->m[i][j],str);CHKERRQ(ierr);
1066c066aebcSStefano Zampini       } else if (bX->m[i][j]) {
1067c066aebcSStefano Zampini         Mat M;
1068c066aebcSStefano Zampini 
1069060bfc19SStefano Zampini         if (str != DIFFERENT_NONZERO_PATTERN) SETERRQ2(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %D,%D. Use DIFFERENT_NONZERO_PATTERN",i,j);
1070c066aebcSStefano Zampini         ierr = MatDuplicate(bX->m[i][j],MAT_COPY_VALUES,&M);CHKERRQ(ierr);
1071c066aebcSStefano Zampini         ierr = MatNestSetSubMat(Y,i,j,M);CHKERRQ(ierr);
1072c066aebcSStefano Zampini         ierr = MatDestroy(&M);CHKERRQ(ierr);
1073c066aebcSStefano Zampini       }
1074060bfc19SStefano Zampini       if (bY->m[i][j]) { ierr = MatGetNonzeroState(bY->m[i][j],&subnnzstate);CHKERRQ(ierr); }
107506a1af2fSStefano Zampini       nnzstate = (PetscBool)(nnzstate || bY->nnzstate[i*nc+j] != subnnzstate);
107606a1af2fSStefano Zampini       bY->nnzstate[i*nc+j] = subnnzstate;
10776e76ffeaSPierre Jolivet     }
10786e76ffeaSPierre Jolivet   }
107906a1af2fSStefano Zampini   if (nnzstate) Y->nonzerostate++;
10806e76ffeaSPierre Jolivet   PetscFunctionReturn(0);
10816e76ffeaSPierre Jolivet }
10826e76ffeaSPierre Jolivet 
1083207556f9SJed Brown static PetscErrorCode MatDuplicate_Nest(Mat A,MatDuplicateOption op,Mat *B)
1084d8588912SDave May {
1085d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
1086841e96a3SJed Brown   Mat            *b;
1087841e96a3SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
1088d8588912SDave May   PetscErrorCode ierr;
1089d8588912SDave May 
1090d8588912SDave May   PetscFunctionBegin;
1091785e854fSJed Brown   ierr = PetscMalloc1(nr*nc,&b);CHKERRQ(ierr);
1092841e96a3SJed Brown   for (i=0; i<nr; i++) {
1093841e96a3SJed Brown     for (j=0; j<nc; j++) {
1094841e96a3SJed Brown       if (bA->m[i][j]) {
1095841e96a3SJed Brown         ierr = MatDuplicate(bA->m[i][j],op,&b[i*nc+j]);CHKERRQ(ierr);
1096841e96a3SJed Brown       } else {
10970298fd71SBarry Smith         b[i*nc+j] = NULL;
1098d8588912SDave May       }
1099d8588912SDave May     }
1100d8588912SDave May   }
1101ce94432eSBarry Smith   ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nr,bA->isglobal.row,nc,bA->isglobal.col,b,B);CHKERRQ(ierr);
1102841e96a3SJed Brown   /* Give the new MatNest exclusive ownership */
1103841e96a3SJed Brown   for (i=0; i<nr*nc; i++) {
11046bf464f9SBarry Smith     ierr = MatDestroy(&b[i]);CHKERRQ(ierr);
1105d8588912SDave May   }
1106d8588912SDave May   ierr = PetscFree(b);CHKERRQ(ierr);
1107d8588912SDave May 
1108841e96a3SJed Brown   ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1109841e96a3SJed Brown   ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1110d8588912SDave May   PetscFunctionReturn(0);
1111d8588912SDave May }
1112d8588912SDave May 
1113d8588912SDave May /* nest api */
1114d8588912SDave May PetscErrorCode MatNestGetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat *mat)
1115d8588912SDave May {
1116d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
11175fd66863SKarl Rupp 
1118d8588912SDave May   PetscFunctionBegin;
1119ce94432eSBarry Smith   if (idxm >= bA->nr) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",idxm,bA->nr-1);
1120ce94432eSBarry Smith   if (jdxm >= bA->nc) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %D max %D",jdxm,bA->nc-1);
1121d8588912SDave May   *mat = bA->m[idxm][jdxm];
1122d8588912SDave May   PetscFunctionReturn(0);
1123d8588912SDave May }
1124d8588912SDave May 
11259ba0d327SJed Brown /*@
1126d8588912SDave May  MatNestGetSubMat - Returns a single, sub-matrix from a nest matrix.
1127d8588912SDave May 
1128d8588912SDave May  Not collective
1129d8588912SDave May 
1130d8588912SDave May  Input Parameters:
1131629881c0SJed Brown +   A  - nest matrix
1132d8588912SDave May .   idxm - index of the matrix within the nest matrix
1133629881c0SJed Brown -   jdxm - index of the matrix within the nest matrix
1134d8588912SDave May 
1135d8588912SDave May  Output Parameter:
1136d8588912SDave May .   sub - matrix at index idxm,jdxm within the nest matrix
1137d8588912SDave May 
1138d8588912SDave May  Level: developer
1139d8588912SDave May 
1140bb97c47cSPierre Jolivet .seealso: MatNestGetSize(), MatNestGetSubMats(), MatCreateNest(), MATNEST, MatNestSetSubMat(),
114179798668SBarry Smith           MatNestGetLocalISs(), MatNestGetISs()
1142d8588912SDave May @*/
11437087cfbeSBarry Smith PetscErrorCode  MatNestGetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat *sub)
1144d8588912SDave May {
1145699a902aSJed Brown   PetscErrorCode ierr;
1146d8588912SDave May 
1147d8588912SDave May   PetscFunctionBegin;
1148699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSubMat_C",(Mat,PetscInt,PetscInt,Mat*),(A,idxm,jdxm,sub));CHKERRQ(ierr);
1149d8588912SDave May   PetscFunctionReturn(0);
1150d8588912SDave May }
1151d8588912SDave May 
11520782ca92SJed Brown PetscErrorCode MatNestSetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat mat)
11530782ca92SJed Brown {
11540782ca92SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
11550782ca92SJed Brown   PetscInt       m,n,M,N,mi,ni,Mi,Ni;
11560782ca92SJed Brown   PetscErrorCode ierr;
11570782ca92SJed Brown 
11580782ca92SJed Brown   PetscFunctionBegin;
1159ce94432eSBarry Smith   if (idxm >= bA->nr) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",idxm,bA->nr-1);
1160ce94432eSBarry Smith   if (jdxm >= bA->nc) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %D max %D",jdxm,bA->nc-1);
11610782ca92SJed Brown   ierr = MatGetLocalSize(mat,&m,&n);CHKERRQ(ierr);
11620782ca92SJed Brown   ierr = MatGetSize(mat,&M,&N);CHKERRQ(ierr);
11630782ca92SJed Brown   ierr = ISGetLocalSize(bA->isglobal.row[idxm],&mi);CHKERRQ(ierr);
11640782ca92SJed Brown   ierr = ISGetSize(bA->isglobal.row[idxm],&Mi);CHKERRQ(ierr);
11650782ca92SJed Brown   ierr = ISGetLocalSize(bA->isglobal.col[jdxm],&ni);CHKERRQ(ierr);
11660782ca92SJed Brown   ierr = ISGetSize(bA->isglobal.col[jdxm],&Ni);CHKERRQ(ierr);
1167ce94432eSBarry Smith   if (M != Mi || N != Ni) SETERRQ4(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix dimension (%D,%D) incompatible with nest block (%D,%D)",M,N,Mi,Ni);
1168ce94432eSBarry Smith   if (m != mi || n != ni) SETERRQ4(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix local dimension (%D,%D) incompatible with nest block (%D,%D)",m,n,mi,ni);
116926fbe8dcSKarl Rupp 
117006a1af2fSStefano Zampini   /* do not increase object state */
117106a1af2fSStefano Zampini   if (mat == bA->m[idxm][jdxm]) PetscFunctionReturn(0);
117206a1af2fSStefano Zampini 
11730782ca92SJed Brown   ierr = PetscObjectReference((PetscObject)mat);CHKERRQ(ierr);
11740782ca92SJed Brown   ierr = MatDestroy(&bA->m[idxm][jdxm]);CHKERRQ(ierr);
11750782ca92SJed Brown   bA->m[idxm][jdxm] = mat;
117606a1af2fSStefano Zampini   ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr);
117706a1af2fSStefano Zampini   ierr = MatGetNonzeroState(mat,&bA->nnzstate[idxm*bA->nc+jdxm]);CHKERRQ(ierr);
117806a1af2fSStefano Zampini   A->nonzerostate++;
11790782ca92SJed Brown   PetscFunctionReturn(0);
11800782ca92SJed Brown }
11810782ca92SJed Brown 
11829ba0d327SJed Brown /*@
11830782ca92SJed Brown  MatNestSetSubMat - Set a single submatrix in the nest matrix.
11840782ca92SJed Brown 
11850782ca92SJed Brown  Logically collective on the submatrix communicator
11860782ca92SJed Brown 
11870782ca92SJed Brown  Input Parameters:
11880782ca92SJed Brown +   A  - nest matrix
11890782ca92SJed Brown .   idxm - index of the matrix within the nest matrix
11900782ca92SJed Brown .   jdxm - index of the matrix within the nest matrix
11910782ca92SJed Brown -   sub - matrix at index idxm,jdxm within the nest matrix
11920782ca92SJed Brown 
11930782ca92SJed Brown  Notes:
11940782ca92SJed Brown  The new submatrix must have the same size and communicator as that block of the nest.
11950782ca92SJed Brown 
11960782ca92SJed Brown  This increments the reference count of the submatrix.
11970782ca92SJed Brown 
11980782ca92SJed Brown  Level: developer
11990782ca92SJed Brown 
1200bb97c47cSPierre Jolivet .seealso: MatNestSetSubMats(), MatNestGetSubMats(), MatNestGetLocalISs(), MATNEST, MatCreateNest(),
120179798668SBarry Smith           MatNestGetSubMat(), MatNestGetISs(), MatNestGetSize()
12020782ca92SJed Brown @*/
12030782ca92SJed Brown PetscErrorCode  MatNestSetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat sub)
12040782ca92SJed Brown {
12050782ca92SJed Brown   PetscErrorCode ierr;
12060782ca92SJed Brown 
12070782ca92SJed Brown   PetscFunctionBegin;
12080782ca92SJed Brown   ierr = PetscUseMethod(A,"MatNestSetSubMat_C",(Mat,PetscInt,PetscInt,Mat),(A,idxm,jdxm,sub));CHKERRQ(ierr);
12090782ca92SJed Brown   PetscFunctionReturn(0);
12100782ca92SJed Brown }
12110782ca92SJed Brown 
1212d8588912SDave May PetscErrorCode MatNestGetSubMats_Nest(Mat A,PetscInt *M,PetscInt *N,Mat ***mat)
1213d8588912SDave May {
1214d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
12155fd66863SKarl Rupp 
1216d8588912SDave May   PetscFunctionBegin;
121726fbe8dcSKarl Rupp   if (M)   *M   = bA->nr;
121826fbe8dcSKarl Rupp   if (N)   *N   = bA->nc;
121926fbe8dcSKarl Rupp   if (mat) *mat = bA->m;
1220d8588912SDave May   PetscFunctionReturn(0);
1221d8588912SDave May }
1222d8588912SDave May 
1223d8588912SDave May /*@C
1224d8588912SDave May  MatNestGetSubMats - Returns the entire two dimensional array of matrices defining a nest matrix.
1225d8588912SDave May 
1226d8588912SDave May  Not collective
1227d8588912SDave May 
1228d8588912SDave May  Input Parameters:
1229629881c0SJed Brown .   A  - nest matrix
1230d8588912SDave May 
1231d8588912SDave May  Output Parameter:
1232629881c0SJed Brown +   M - number of rows in the nest matrix
1233d8588912SDave May .   N - number of cols in the nest matrix
1234629881c0SJed Brown -   mat - 2d array of matrices
1235d8588912SDave May 
1236d8588912SDave May  Notes:
1237d8588912SDave May 
1238d8588912SDave May  The user should not free the array mat.
1239d8588912SDave May 
1240351962e3SVincent Le Chenadec  In Fortran, this routine has a calling sequence
1241351962e3SVincent Le Chenadec $   call MatNestGetSubMats(A, M, N, mat, ierr)
1242351962e3SVincent Le Chenadec  where the space allocated for the optional argument mat is assumed large enough (if provided).
1243351962e3SVincent Le Chenadec 
1244d8588912SDave May  Level: developer
1245d8588912SDave May 
1246bb97c47cSPierre Jolivet .seealso: MatNestGetSize(), MatNestGetSubMat(), MatNestGetLocalISs(), MATNEST, MatCreateNest(),
124779798668SBarry Smith           MatNestSetSubMats(), MatNestGetISs(), MatNestSetSubMat()
1248d8588912SDave May @*/
12497087cfbeSBarry Smith PetscErrorCode  MatNestGetSubMats(Mat A,PetscInt *M,PetscInt *N,Mat ***mat)
1250d8588912SDave May {
1251699a902aSJed Brown   PetscErrorCode ierr;
1252d8588912SDave May 
1253d8588912SDave May   PetscFunctionBegin;
1254699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSubMats_C",(Mat,PetscInt*,PetscInt*,Mat***),(A,M,N,mat));CHKERRQ(ierr);
1255d8588912SDave May   PetscFunctionReturn(0);
1256d8588912SDave May }
1257d8588912SDave May 
12587087cfbeSBarry Smith PetscErrorCode  MatNestGetSize_Nest(Mat A,PetscInt *M,PetscInt *N)
1259d8588912SDave May {
1260d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
1261d8588912SDave May 
1262d8588912SDave May   PetscFunctionBegin;
126326fbe8dcSKarl Rupp   if (M) *M = bA->nr;
126426fbe8dcSKarl Rupp   if (N) *N = bA->nc;
1265d8588912SDave May   PetscFunctionReturn(0);
1266d8588912SDave May }
1267d8588912SDave May 
12689ba0d327SJed Brown /*@
1269d8588912SDave May  MatNestGetSize - Returns the size of the nest matrix.
1270d8588912SDave May 
1271d8588912SDave May  Not collective
1272d8588912SDave May 
1273d8588912SDave May  Input Parameters:
1274d8588912SDave May .   A  - nest matrix
1275d8588912SDave May 
1276d8588912SDave May  Output Parameter:
1277629881c0SJed Brown +   M - number of rows in the nested mat
1278629881c0SJed Brown -   N - number of cols in the nested mat
1279d8588912SDave May 
1280d8588912SDave May  Notes:
1281d8588912SDave May 
1282d8588912SDave May  Level: developer
1283d8588912SDave May 
1284bb97c47cSPierre Jolivet .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MATNEST, MatCreateNest(), MatNestGetLocalISs(),
128579798668SBarry Smith           MatNestGetISs()
1286d8588912SDave May @*/
12877087cfbeSBarry Smith PetscErrorCode  MatNestGetSize(Mat A,PetscInt *M,PetscInt *N)
1288d8588912SDave May {
1289699a902aSJed Brown   PetscErrorCode ierr;
1290d8588912SDave May 
1291d8588912SDave May   PetscFunctionBegin;
1292699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSize_C",(Mat,PetscInt*,PetscInt*),(A,M,N));CHKERRQ(ierr);
1293d8588912SDave May   PetscFunctionReturn(0);
1294d8588912SDave May }
1295d8588912SDave May 
1296f7a08781SBarry Smith static PetscErrorCode MatNestGetISs_Nest(Mat A,IS rows[],IS cols[])
1297900e7ff2SJed Brown {
1298900e7ff2SJed Brown   Mat_Nest *vs = (Mat_Nest*)A->data;
1299900e7ff2SJed Brown   PetscInt i;
1300900e7ff2SJed Brown 
1301900e7ff2SJed Brown   PetscFunctionBegin;
1302900e7ff2SJed Brown   if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->isglobal.row[i];
1303900e7ff2SJed Brown   if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->isglobal.col[i];
1304900e7ff2SJed Brown   PetscFunctionReturn(0);
1305900e7ff2SJed Brown }
1306900e7ff2SJed Brown 
13073a4d7b9aSSatish Balay /*@C
1308900e7ff2SJed Brown  MatNestGetISs - Returns the index sets partitioning the row and column spaces
1309900e7ff2SJed Brown 
1310900e7ff2SJed Brown  Not collective
1311900e7ff2SJed Brown 
1312900e7ff2SJed Brown  Input Parameters:
1313900e7ff2SJed Brown .   A  - nest matrix
1314900e7ff2SJed Brown 
1315900e7ff2SJed Brown  Output Parameter:
1316900e7ff2SJed Brown +   rows - array of row index sets
1317900e7ff2SJed Brown -   cols - array of column index sets
1318900e7ff2SJed Brown 
1319900e7ff2SJed Brown  Level: advanced
1320900e7ff2SJed Brown 
1321900e7ff2SJed Brown  Notes:
1322900e7ff2SJed Brown  The user must have allocated arrays of the correct size. The reference count is not increased on the returned ISs.
1323900e7ff2SJed Brown 
132479798668SBarry Smith .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetLocalISs(), MATNEST,
1325bb97c47cSPierre Jolivet           MatCreateNest(), MatNestGetSubMats(), MatNestSetSubMats()
1326900e7ff2SJed Brown @*/
1327900e7ff2SJed Brown PetscErrorCode  MatNestGetISs(Mat A,IS rows[],IS cols[])
1328900e7ff2SJed Brown {
1329900e7ff2SJed Brown   PetscErrorCode ierr;
1330900e7ff2SJed Brown 
1331900e7ff2SJed Brown   PetscFunctionBegin;
1332900e7ff2SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1333900e7ff2SJed Brown   ierr = PetscUseMethod(A,"MatNestGetISs_C",(Mat,IS[],IS[]),(A,rows,cols));CHKERRQ(ierr);
1334900e7ff2SJed Brown   PetscFunctionReturn(0);
1335900e7ff2SJed Brown }
1336900e7ff2SJed Brown 
1337f7a08781SBarry Smith static PetscErrorCode MatNestGetLocalISs_Nest(Mat A,IS rows[],IS cols[])
1338900e7ff2SJed Brown {
1339900e7ff2SJed Brown   Mat_Nest *vs = (Mat_Nest*)A->data;
1340900e7ff2SJed Brown   PetscInt i;
1341900e7ff2SJed Brown 
1342900e7ff2SJed Brown   PetscFunctionBegin;
1343900e7ff2SJed Brown   if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->islocal.row[i];
1344900e7ff2SJed Brown   if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->islocal.col[i];
1345900e7ff2SJed Brown   PetscFunctionReturn(0);
1346900e7ff2SJed Brown }
1347900e7ff2SJed Brown 
1348900e7ff2SJed Brown /*@C
1349900e7ff2SJed Brown  MatNestGetLocalISs - Returns the index sets partitioning the row and column spaces
1350900e7ff2SJed Brown 
1351900e7ff2SJed Brown  Not collective
1352900e7ff2SJed Brown 
1353900e7ff2SJed Brown  Input Parameters:
1354900e7ff2SJed Brown .   A  - nest matrix
1355900e7ff2SJed Brown 
1356900e7ff2SJed Brown  Output Parameter:
13570298fd71SBarry Smith +   rows - array of row index sets (or NULL to ignore)
13580298fd71SBarry Smith -   cols - array of column index sets (or NULL to ignore)
1359900e7ff2SJed Brown 
1360900e7ff2SJed Brown  Level: advanced
1361900e7ff2SJed Brown 
1362900e7ff2SJed Brown  Notes:
1363900e7ff2SJed Brown  The user must have allocated arrays of the correct size. The reference count is not increased on the returned ISs.
1364900e7ff2SJed Brown 
1365bb97c47cSPierre Jolivet .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetISs(), MatCreateNest(),
136679798668SBarry Smith           MATNEST, MatNestSetSubMats(), MatNestSetSubMat()
1367900e7ff2SJed Brown @*/
1368900e7ff2SJed Brown PetscErrorCode  MatNestGetLocalISs(Mat A,IS rows[],IS cols[])
1369900e7ff2SJed Brown {
1370900e7ff2SJed Brown   PetscErrorCode ierr;
1371900e7ff2SJed Brown 
1372900e7ff2SJed Brown   PetscFunctionBegin;
1373900e7ff2SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1374900e7ff2SJed Brown   ierr = PetscUseMethod(A,"MatNestGetLocalISs_C",(Mat,IS[],IS[]),(A,rows,cols));CHKERRQ(ierr);
1375900e7ff2SJed Brown   PetscFunctionReturn(0);
1376900e7ff2SJed Brown }
1377900e7ff2SJed Brown 
137819fd82e9SBarry Smith PetscErrorCode  MatNestSetVecType_Nest(Mat A,VecType vtype)
1379207556f9SJed Brown {
1380207556f9SJed Brown   PetscErrorCode ierr;
1381207556f9SJed Brown   PetscBool      flg;
1382207556f9SJed Brown 
1383207556f9SJed Brown   PetscFunctionBegin;
1384207556f9SJed Brown   ierr = PetscStrcmp(vtype,VECNEST,&flg);CHKERRQ(ierr);
1385207556f9SJed Brown   /* In reality, this only distinguishes VECNEST and "other" */
13862a7a6963SBarry Smith   if (flg) A->ops->getvecs = MatCreateVecs_Nest;
138712b53f24SSatish Balay   else A->ops->getvecs = (PetscErrorCode (*)(Mat,Vec*,Vec*)) 0;
1388207556f9SJed Brown   PetscFunctionReturn(0);
1389207556f9SJed Brown }
1390207556f9SJed Brown 
1391207556f9SJed Brown /*@C
13922a7a6963SBarry Smith  MatNestSetVecType - Sets the type of Vec returned by MatCreateVecs()
1393207556f9SJed Brown 
1394207556f9SJed Brown  Not collective
1395207556f9SJed Brown 
1396207556f9SJed Brown  Input Parameters:
1397207556f9SJed Brown +  A  - nest matrix
1398207556f9SJed Brown -  vtype - type to use for creating vectors
1399207556f9SJed Brown 
1400207556f9SJed Brown  Notes:
1401207556f9SJed Brown 
1402207556f9SJed Brown  Level: developer
1403207556f9SJed Brown 
1404bb97c47cSPierre Jolivet .seealso: MatCreateVecs(), MATNEST, MatCreateNest()
1405207556f9SJed Brown @*/
140619fd82e9SBarry Smith PetscErrorCode  MatNestSetVecType(Mat A,VecType vtype)
1407207556f9SJed Brown {
1408207556f9SJed Brown   PetscErrorCode ierr;
1409207556f9SJed Brown 
1410207556f9SJed Brown   PetscFunctionBegin;
141119fd82e9SBarry Smith   ierr = PetscTryMethod(A,"MatNestSetVecType_C",(Mat,VecType),(A,vtype));CHKERRQ(ierr);
1412207556f9SJed Brown   PetscFunctionReturn(0);
1413207556f9SJed Brown }
1414207556f9SJed Brown 
1415c8883902SJed Brown PetscErrorCode MatNestSetSubMats_Nest(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[])
1416d8588912SDave May {
1417c8883902SJed Brown   Mat_Nest       *s = (Mat_Nest*)A->data;
1418c8883902SJed Brown   PetscInt       i,j,m,n,M,N;
1419d8588912SDave May   PetscErrorCode ierr;
142006a1af2fSStefano Zampini   PetscBool      cong;
1421d8588912SDave May 
1422d8588912SDave May   PetscFunctionBegin;
142306a1af2fSStefano Zampini   ierr = MatReset_Nest(A);CHKERRQ(ierr);
142406a1af2fSStefano Zampini 
1425c8883902SJed Brown   s->nr = nr;
1426c8883902SJed Brown   s->nc = nc;
1427d8588912SDave May 
1428c8883902SJed Brown   /* Create space for submatrices */
1429854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&s->m);CHKERRQ(ierr);
1430c8883902SJed Brown   for (i=0; i<nr; i++) {
1431854ce69bSBarry Smith     ierr = PetscMalloc1(nc,&s->m[i]);CHKERRQ(ierr);
1432d8588912SDave May   }
1433c8883902SJed Brown   for (i=0; i<nr; i++) {
1434c8883902SJed Brown     for (j=0; j<nc; j++) {
1435c8883902SJed Brown       s->m[i][j] = a[i*nc+j];
1436c8883902SJed Brown       if (a[i*nc+j]) {
1437c8883902SJed Brown         ierr = PetscObjectReference((PetscObject)a[i*nc+j]);CHKERRQ(ierr);
1438d8588912SDave May       }
1439d8588912SDave May     }
1440d8588912SDave May   }
1441d8588912SDave May 
14428188e55aSJed Brown   ierr = MatSetUp_NestIS_Private(A,nr,is_row,nc,is_col);CHKERRQ(ierr);
1443d8588912SDave May 
1444854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&s->row_len);CHKERRQ(ierr);
1445854ce69bSBarry Smith   ierr = PetscMalloc1(nc,&s->col_len);CHKERRQ(ierr);
1446c8883902SJed Brown   for (i=0; i<nr; i++) s->row_len[i]=-1;
1447c8883902SJed Brown   for (j=0; j<nc; j++) s->col_len[j]=-1;
1448d8588912SDave May 
144906a1af2fSStefano Zampini   ierr = PetscCalloc1(nr*nc,&s->nnzstate);CHKERRQ(ierr);
145006a1af2fSStefano Zampini   for (i=0; i<nr; i++) {
145106a1af2fSStefano Zampini     for (j=0; j<nc; j++) {
145206a1af2fSStefano Zampini       if (s->m[i][j]) {
145306a1af2fSStefano Zampini         ierr = MatGetNonzeroState(s->m[i][j],&s->nnzstate[i*nc+j]);CHKERRQ(ierr);
145406a1af2fSStefano Zampini       }
145506a1af2fSStefano Zampini     }
145606a1af2fSStefano Zampini   }
145706a1af2fSStefano Zampini 
14588188e55aSJed Brown   ierr = MatNestGetSizes_Private(A,&m,&n,&M,&N);CHKERRQ(ierr);
1459d8588912SDave May 
1460c8883902SJed Brown   ierr = PetscLayoutSetSize(A->rmap,M);CHKERRQ(ierr);
1461c8883902SJed Brown   ierr = PetscLayoutSetLocalSize(A->rmap,m);CHKERRQ(ierr);
1462c8883902SJed Brown   ierr = PetscLayoutSetSize(A->cmap,N);CHKERRQ(ierr);
1463c8883902SJed Brown   ierr = PetscLayoutSetLocalSize(A->cmap,n);CHKERRQ(ierr);
1464c8883902SJed Brown 
1465c8883902SJed Brown   ierr = PetscLayoutSetUp(A->rmap);CHKERRQ(ierr);
1466c8883902SJed Brown   ierr = PetscLayoutSetUp(A->cmap);CHKERRQ(ierr);
1467c8883902SJed Brown 
146806a1af2fSStefano Zampini   /* disable operations that are not supported for non-square matrices,
146906a1af2fSStefano Zampini      or matrices for which is_row != is_col  */
147006a1af2fSStefano Zampini   ierr = MatHasCongruentLayouts(A,&cong);CHKERRQ(ierr);
147106a1af2fSStefano Zampini   if (cong && nr != nc) cong = PETSC_FALSE;
147206a1af2fSStefano Zampini   if (cong) {
147306a1af2fSStefano Zampini     for (i = 0; cong && i < nr; i++) {
1474320466b0SStefano Zampini       ierr = ISEqualUnsorted(s->isglobal.row[i],s->isglobal.col[i],&cong);CHKERRQ(ierr);
147506a1af2fSStefano Zampini     }
147606a1af2fSStefano Zampini   }
147706a1af2fSStefano Zampini   if (!cong) {
1478381b8e50SStefano Zampini     A->ops->missingdiagonal = NULL;
147906a1af2fSStefano Zampini     A->ops->getdiagonal     = NULL;
148006a1af2fSStefano Zampini     A->ops->shift           = NULL;
148106a1af2fSStefano Zampini     A->ops->diagonalset     = NULL;
148206a1af2fSStefano Zampini   }
148306a1af2fSStefano Zampini 
14841795a4d1SJed Brown   ierr = PetscCalloc2(nr,&s->left,nc,&s->right);CHKERRQ(ierr);
148506a1af2fSStefano Zampini   ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr);
148606a1af2fSStefano Zampini   A->nonzerostate++;
1487d8588912SDave May   PetscFunctionReturn(0);
1488d8588912SDave May }
1489d8588912SDave May 
1490c8883902SJed Brown /*@
1491c8883902SJed Brown    MatNestSetSubMats - Sets the nested submatrices
1492c8883902SJed Brown 
1493c8883902SJed Brown    Collective on Mat
1494c8883902SJed Brown 
1495c8883902SJed Brown    Input Parameter:
1496ffd6319bSRichard Tran Mills +  A - nested matrix
1497c8883902SJed Brown .  nr - number of nested row blocks
14980298fd71SBarry Smith .  is_row - index sets for each nested row block, or NULL to make contiguous
1499c8883902SJed Brown .  nc - number of nested column blocks
15000298fd71SBarry Smith .  is_col - index sets for each nested column block, or NULL to make contiguous
15010298fd71SBarry Smith -  a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL
1502c8883902SJed Brown 
150306a1af2fSStefano Zampini    Notes: this always resets any submatrix information previously set
150406a1af2fSStefano Zampini 
1505c8883902SJed Brown    Level: advanced
1506c8883902SJed Brown 
150779798668SBarry Smith .seealso: MatCreateNest(), MATNEST, MatNestSetSubMat(), MatNestGetSubMat(), MatNestGetSubMats()
1508c8883902SJed Brown @*/
1509c8883902SJed Brown PetscErrorCode MatNestSetSubMats(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[])
1510c8883902SJed Brown {
1511c8883902SJed Brown   PetscErrorCode ierr;
151206a1af2fSStefano Zampini   PetscInt       i;
1513c8883902SJed Brown 
1514c8883902SJed Brown   PetscFunctionBegin;
1515c8883902SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1516ce94432eSBarry Smith   if (nr < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of rows cannot be negative");
1517c8883902SJed Brown   if (nr && is_row) {
1518c8883902SJed Brown     PetscValidPointer(is_row,3);
1519c8883902SJed Brown     for (i=0; i<nr; i++) PetscValidHeaderSpecific(is_row[i],IS_CLASSID,3);
1520c8883902SJed Brown   }
1521ce94432eSBarry Smith   if (nc < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of columns cannot be negative");
15221664e352SJed Brown   if (nc && is_col) {
1523c8883902SJed Brown     PetscValidPointer(is_col,5);
15249b30a8f6SBarry Smith     for (i=0; i<nc; i++) PetscValidHeaderSpecific(is_col[i],IS_CLASSID,5);
1525c8883902SJed Brown   }
152606a1af2fSStefano Zampini   if (nr*nc > 0) PetscValidPointer(a,6);
1527c8883902SJed Brown   ierr = PetscUseMethod(A,"MatNestSetSubMats_C",(Mat,PetscInt,const IS[],PetscInt,const IS[],const Mat[]),(A,nr,is_row,nc,is_col,a));CHKERRQ(ierr);
1528c8883902SJed Brown   PetscFunctionReturn(0);
1529c8883902SJed Brown }
1530d8588912SDave May 
153145b6f7e9SBarry Smith static PetscErrorCode MatNestCreateAggregateL2G_Private(Mat A,PetscInt n,const IS islocal[],const IS isglobal[],PetscBool colflg,ISLocalToGlobalMapping *ltog)
153277019fcaSJed Brown {
153377019fcaSJed Brown   PetscErrorCode ierr;
153477019fcaSJed Brown   PetscBool      flg;
153577019fcaSJed Brown   PetscInt       i,j,m,mi,*ix;
153677019fcaSJed Brown 
153777019fcaSJed Brown   PetscFunctionBegin;
1538aea6d515SStefano Zampini   *ltog = NULL;
153977019fcaSJed Brown   for (i=0,m=0,flg=PETSC_FALSE; i<n; i++) {
154077019fcaSJed Brown     if (islocal[i]) {
1541aea6d515SStefano Zampini       ierr = ISGetLocalSize(islocal[i],&mi);CHKERRQ(ierr);
154277019fcaSJed Brown       flg  = PETSC_TRUE;      /* We found a non-trivial entry */
154377019fcaSJed Brown     } else {
1544aea6d515SStefano Zampini       ierr = ISGetLocalSize(isglobal[i],&mi);CHKERRQ(ierr);
154577019fcaSJed Brown     }
154677019fcaSJed Brown     m += mi;
154777019fcaSJed Brown   }
1548aea6d515SStefano Zampini   if (!flg) PetscFunctionReturn(0);
1549aea6d515SStefano Zampini 
1550785e854fSJed Brown   ierr = PetscMalloc1(m,&ix);CHKERRQ(ierr);
1551165cd838SBarry Smith   for (i=0,m=0; i<n; i++) {
15520298fd71SBarry Smith     ISLocalToGlobalMapping smap = NULL;
1553e108cb99SStefano Zampini     Mat                    sub = NULL;
1554f6d38dbbSStefano Zampini     PetscSF                sf;
1555f6d38dbbSStefano Zampini     PetscLayout            map;
1556aea6d515SStefano Zampini     const PetscInt         *ix2;
155777019fcaSJed Brown 
1558165cd838SBarry Smith     if (!colflg) {
155977019fcaSJed Brown       ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
156077019fcaSJed Brown     } else {
156177019fcaSJed Brown       ierr = MatNestFindNonzeroSubMatCol(A,i,&sub);CHKERRQ(ierr);
156277019fcaSJed Brown     }
1563191fd14bSBarry Smith     if (sub) {
1564191fd14bSBarry Smith       if (!colflg) {
1565191fd14bSBarry Smith         ierr = MatGetLocalToGlobalMapping(sub,&smap,NULL);CHKERRQ(ierr);
1566191fd14bSBarry Smith       } else {
1567191fd14bSBarry Smith         ierr = MatGetLocalToGlobalMapping(sub,NULL,&smap);CHKERRQ(ierr);
1568191fd14bSBarry Smith       }
1569191fd14bSBarry Smith     }
157077019fcaSJed Brown     /*
157177019fcaSJed Brown        Now we need to extract the monolithic global indices that correspond to the given split global indices.
157277019fcaSJed Brown        In many/most cases, we only want MatGetLocalSubMatrix() to work, in which case we only need to know the size of the local spaces.
157377019fcaSJed Brown     */
1574aea6d515SStefano Zampini     ierr = ISGetIndices(isglobal[i],&ix2);CHKERRQ(ierr);
1575aea6d515SStefano Zampini     if (islocal[i]) {
1576aea6d515SStefano Zampini       PetscInt *ilocal,*iremote;
1577aea6d515SStefano Zampini       PetscInt mil,nleaves;
1578aea6d515SStefano Zampini 
1579aea6d515SStefano Zampini       ierr = ISGetLocalSize(islocal[i],&mi);CHKERRQ(ierr);
1580aea6d515SStefano Zampini       if (!smap) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"Missing local to global map");
1581aea6d515SStefano Zampini       for (j=0; j<mi; j++) ix[m+j] = j;
1582aea6d515SStefano Zampini       ierr = ISLocalToGlobalMappingApply(smap,mi,ix+m,ix+m);CHKERRQ(ierr);
1583aea6d515SStefano Zampini 
1584aea6d515SStefano Zampini       /* PetscSFSetGraphLayout does not like negative indices */
1585aea6d515SStefano Zampini       ierr = PetscMalloc2(mi,&ilocal,mi,&iremote);CHKERRQ(ierr);
1586aea6d515SStefano Zampini       for (j=0, nleaves = 0; j<mi; j++) {
1587aea6d515SStefano Zampini         if (ix[m+j] < 0) continue;
1588aea6d515SStefano Zampini         ilocal[nleaves]  = j;
1589aea6d515SStefano Zampini         iremote[nleaves] = ix[m+j];
1590aea6d515SStefano Zampini         nleaves++;
1591aea6d515SStefano Zampini       }
1592aea6d515SStefano Zampini       ierr = ISGetLocalSize(isglobal[i],&mil);CHKERRQ(ierr);
1593aea6d515SStefano Zampini       ierr = PetscSFCreate(PetscObjectComm((PetscObject)A),&sf);CHKERRQ(ierr);
1594aea6d515SStefano Zampini       ierr = PetscLayoutCreate(PetscObjectComm((PetscObject)A),&map);CHKERRQ(ierr);
1595aea6d515SStefano Zampini       ierr = PetscLayoutSetLocalSize(map,mil);CHKERRQ(ierr);
1596f6d38dbbSStefano Zampini       ierr = PetscLayoutSetUp(map);CHKERRQ(ierr);
1597aea6d515SStefano Zampini       ierr = PetscSFSetGraphLayout(sf,map,nleaves,ilocal,PETSC_USE_POINTER,iremote);CHKERRQ(ierr);
1598f6d38dbbSStefano Zampini       ierr = PetscLayoutDestroy(&map);CHKERRQ(ierr);
1599f6d38dbbSStefano Zampini       ierr = PetscSFBcastBegin(sf,MPIU_INT,ix2,ix + m);CHKERRQ(ierr);
1600f6d38dbbSStefano Zampini       ierr = PetscSFBcastEnd(sf,MPIU_INT,ix2,ix + m);CHKERRQ(ierr);
1601f6d38dbbSStefano Zampini       ierr = PetscSFDestroy(&sf);CHKERRQ(ierr);
1602aea6d515SStefano Zampini       ierr = PetscFree2(ilocal,iremote);CHKERRQ(ierr);
1603aea6d515SStefano Zampini     } else {
1604aea6d515SStefano Zampini       ierr = ISGetLocalSize(isglobal[i],&mi);CHKERRQ(ierr);
1605aea6d515SStefano Zampini       for (j=0; j<mi; j++) ix[m+j] = ix2[i];
1606aea6d515SStefano Zampini     }
1607aea6d515SStefano Zampini     ierr = ISRestoreIndices(isglobal[i],&ix2);CHKERRQ(ierr);
160877019fcaSJed Brown     m   += mi;
160977019fcaSJed Brown   }
1610f0413b6fSBarry Smith   ierr = ISLocalToGlobalMappingCreate(PetscObjectComm((PetscObject)A),1,m,ix,PETSC_OWN_POINTER,ltog);CHKERRQ(ierr);
161177019fcaSJed Brown   PetscFunctionReturn(0);
161277019fcaSJed Brown }
161377019fcaSJed Brown 
161477019fcaSJed Brown 
1615d8588912SDave May /* If an IS was provided, there is nothing Nest needs to do, otherwise Nest will build a strided IS */
1616d8588912SDave May /*
1617d8588912SDave May   nprocessors = NP
1618d8588912SDave May   Nest x^T = ((g_0,g_1,...g_nprocs-1), (h_0,h_1,...h_NP-1))
1619d8588912SDave May        proc 0: => (g_0,h_0,)
1620d8588912SDave May        proc 1: => (g_1,h_1,)
1621d8588912SDave May        ...
1622d8588912SDave May        proc nprocs-1: => (g_NP-1,h_NP-1,)
1623d8588912SDave May 
1624d8588912SDave May             proc 0:                      proc 1:                    proc nprocs-1:
1625d8588912SDave May     is[0] = (0,1,2,...,nlocal(g_0)-1)  (0,1,...,nlocal(g_1)-1)  (0,1,...,nlocal(g_NP-1))
1626d8588912SDave May 
1627d8588912SDave May             proc 0:
1628d8588912SDave May     is[1] = (nlocal(g_0),nlocal(g_0)+1,...,nlocal(g_0)+nlocal(h_0)-1)
1629d8588912SDave May             proc 1:
1630d8588912SDave May     is[1] = (nlocal(g_1),nlocal(g_1)+1,...,nlocal(g_1)+nlocal(h_1)-1)
1631d8588912SDave May 
1632d8588912SDave May             proc NP-1:
1633d8588912SDave May     is[1] = (nlocal(g_NP-1),nlocal(g_NP-1)+1,...,nlocal(g_NP-1)+nlocal(h_NP-1)-1)
1634d8588912SDave May */
1635841e96a3SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[])
1636d8588912SDave May {
1637e2d7f03fSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
16388188e55aSJed Brown   PetscInt       i,j,offset,n,nsum,bs;
1639d8588912SDave May   PetscErrorCode ierr;
16400298fd71SBarry Smith   Mat            sub = NULL;
1641d8588912SDave May 
1642d8588912SDave May   PetscFunctionBegin;
1643854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&vs->isglobal.row);CHKERRQ(ierr);
1644854ce69bSBarry Smith   ierr = PetscMalloc1(nc,&vs->isglobal.col);CHKERRQ(ierr);
1645d8588912SDave May   if (is_row) { /* valid IS is passed in */
1646d8588912SDave May     /* refs on is[] are incremeneted */
1647e2d7f03fSJed Brown     for (i=0; i<vs->nr; i++) {
1648d8588912SDave May       ierr = PetscObjectReference((PetscObject)is_row[i]);CHKERRQ(ierr);
164926fbe8dcSKarl Rupp 
1650e2d7f03fSJed Brown       vs->isglobal.row[i] = is_row[i];
1651d8588912SDave May     }
16522ae74bdbSJed Brown   } else {                      /* Create the ISs by inspecting sizes of a submatrix in each row */
16538188e55aSJed Brown     nsum = 0;
16548188e55aSJed Brown     for (i=0; i<vs->nr; i++) {  /* Add up the local sizes to compute the aggregate offset */
16558188e55aSJed Brown       ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
1656ce94432eSBarry Smith       if (!sub) SETERRQ1(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in row %D",i);
16570298fd71SBarry Smith       ierr = MatGetLocalSize(sub,&n,NULL);CHKERRQ(ierr);
1658ce94432eSBarry Smith       if (n < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix");
16598188e55aSJed Brown       nsum += n;
16608188e55aSJed Brown     }
166155b25c41SPierre Jolivet     ierr    = MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A));CHKERRMPI(ierr);
166230bc264bSJed Brown     offset -= nsum;
1663e2d7f03fSJed Brown     for (i=0; i<vs->nr; i++) {
1664f349c1fdSJed Brown       ierr    = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
16650298fd71SBarry Smith       ierr    = MatGetLocalSize(sub,&n,NULL);CHKERRQ(ierr);
166673b6653fSLawrence Mitchell       ierr    = MatGetBlockSizes(sub,&bs,NULL);CHKERRQ(ierr);
1667ce94432eSBarry Smith       ierr    = ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.row[i]);CHKERRQ(ierr);
1668e2d7f03fSJed Brown       ierr    = ISSetBlockSize(vs->isglobal.row[i],bs);CHKERRQ(ierr);
16692ae74bdbSJed Brown       offset += n;
1670d8588912SDave May     }
1671d8588912SDave May   }
1672d8588912SDave May 
1673d8588912SDave May   if (is_col) { /* valid IS is passed in */
1674d8588912SDave May     /* refs on is[] are incremeneted */
1675e2d7f03fSJed Brown     for (j=0; j<vs->nc; j++) {
1676d8588912SDave May       ierr = PetscObjectReference((PetscObject)is_col[j]);CHKERRQ(ierr);
167726fbe8dcSKarl Rupp 
1678e2d7f03fSJed Brown       vs->isglobal.col[j] = is_col[j];
1679d8588912SDave May     }
16802ae74bdbSJed Brown   } else {                      /* Create the ISs by inspecting sizes of a submatrix in each column */
16812ae74bdbSJed Brown     offset = A->cmap->rstart;
16828188e55aSJed Brown     nsum   = 0;
16838188e55aSJed Brown     for (j=0; j<vs->nc; j++) {
16848188e55aSJed Brown       ierr = MatNestFindNonzeroSubMatCol(A,j,&sub);CHKERRQ(ierr);
1685ce94432eSBarry Smith       if (!sub) SETERRQ1(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in column %D",i);
16860298fd71SBarry Smith       ierr = MatGetLocalSize(sub,NULL,&n);CHKERRQ(ierr);
1687ce94432eSBarry Smith       if (n < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix");
16888188e55aSJed Brown       nsum += n;
16898188e55aSJed Brown     }
169055b25c41SPierre Jolivet     ierr    = MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A));CHKERRMPI(ierr);
169130bc264bSJed Brown     offset -= nsum;
1692e2d7f03fSJed Brown     for (j=0; j<vs->nc; j++) {
1693f349c1fdSJed Brown       ierr    = MatNestFindNonzeroSubMatCol(A,j,&sub);CHKERRQ(ierr);
16940298fd71SBarry Smith       ierr    = MatGetLocalSize(sub,NULL,&n);CHKERRQ(ierr);
169573b6653fSLawrence Mitchell       ierr    = MatGetBlockSizes(sub,NULL,&bs);CHKERRQ(ierr);
1696ce94432eSBarry Smith       ierr    = ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.col[j]);CHKERRQ(ierr);
1697e2d7f03fSJed Brown       ierr    = ISSetBlockSize(vs->isglobal.col[j],bs);CHKERRQ(ierr);
16982ae74bdbSJed Brown       offset += n;
1699d8588912SDave May     }
1700d8588912SDave May   }
1701e2d7f03fSJed Brown 
1702e2d7f03fSJed Brown   /* Set up the local ISs */
1703785e854fSJed Brown   ierr = PetscMalloc1(vs->nr,&vs->islocal.row);CHKERRQ(ierr);
1704785e854fSJed Brown   ierr = PetscMalloc1(vs->nc,&vs->islocal.col);CHKERRQ(ierr);
1705e2d7f03fSJed Brown   for (i=0,offset=0; i<vs->nr; i++) {
1706e2d7f03fSJed Brown     IS                     isloc;
17070298fd71SBarry Smith     ISLocalToGlobalMapping rmap = NULL;
1708e2d7f03fSJed Brown     PetscInt               nlocal,bs;
1709e2d7f03fSJed Brown     ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
17100298fd71SBarry Smith     if (sub) {ierr = MatGetLocalToGlobalMapping(sub,&rmap,NULL);CHKERRQ(ierr);}
1711207556f9SJed Brown     if (rmap) {
171273b6653fSLawrence Mitchell       ierr = MatGetBlockSizes(sub,&bs,NULL);CHKERRQ(ierr);
1713e2d7f03fSJed Brown       ierr = ISLocalToGlobalMappingGetSize(rmap,&nlocal);CHKERRQ(ierr);
1714e2d7f03fSJed Brown       ierr = ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc);CHKERRQ(ierr);
1715e2d7f03fSJed Brown       ierr = ISSetBlockSize(isloc,bs);CHKERRQ(ierr);
1716207556f9SJed Brown     } else {
1717207556f9SJed Brown       nlocal = 0;
17180298fd71SBarry Smith       isloc  = NULL;
1719207556f9SJed Brown     }
1720e2d7f03fSJed Brown     vs->islocal.row[i] = isloc;
1721e2d7f03fSJed Brown     offset            += nlocal;
1722e2d7f03fSJed Brown   }
17238188e55aSJed Brown   for (i=0,offset=0; i<vs->nc; i++) {
1724e2d7f03fSJed Brown     IS                     isloc;
17250298fd71SBarry Smith     ISLocalToGlobalMapping cmap = NULL;
1726e2d7f03fSJed Brown     PetscInt               nlocal,bs;
1727e2d7f03fSJed Brown     ierr = MatNestFindNonzeroSubMatCol(A,i,&sub);CHKERRQ(ierr);
17280298fd71SBarry Smith     if (sub) {ierr = MatGetLocalToGlobalMapping(sub,NULL,&cmap);CHKERRQ(ierr);}
1729207556f9SJed Brown     if (cmap) {
173073b6653fSLawrence Mitchell       ierr = MatGetBlockSizes(sub,NULL,&bs);CHKERRQ(ierr);
1731e2d7f03fSJed Brown       ierr = ISLocalToGlobalMappingGetSize(cmap,&nlocal);CHKERRQ(ierr);
1732e2d7f03fSJed Brown       ierr = ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc);CHKERRQ(ierr);
1733e2d7f03fSJed Brown       ierr = ISSetBlockSize(isloc,bs);CHKERRQ(ierr);
1734207556f9SJed Brown     } else {
1735207556f9SJed Brown       nlocal = 0;
17360298fd71SBarry Smith       isloc  = NULL;
1737207556f9SJed Brown     }
1738e2d7f03fSJed Brown     vs->islocal.col[i] = isloc;
1739e2d7f03fSJed Brown     offset            += nlocal;
1740e2d7f03fSJed Brown   }
17410189643fSJed Brown 
174277019fcaSJed Brown   /* Set up the aggregate ISLocalToGlobalMapping */
174377019fcaSJed Brown   {
174445b6f7e9SBarry Smith     ISLocalToGlobalMapping rmap,cmap;
174545b6f7e9SBarry Smith     ierr = MatNestCreateAggregateL2G_Private(A,vs->nr,vs->islocal.row,vs->isglobal.row,PETSC_FALSE,&rmap);CHKERRQ(ierr);
174645b6f7e9SBarry Smith     ierr = MatNestCreateAggregateL2G_Private(A,vs->nc,vs->islocal.col,vs->isglobal.col,PETSC_TRUE,&cmap);CHKERRQ(ierr);
174777019fcaSJed Brown     if (rmap && cmap) {ierr = MatSetLocalToGlobalMapping(A,rmap,cmap);CHKERRQ(ierr);}
174877019fcaSJed Brown     ierr = ISLocalToGlobalMappingDestroy(&rmap);CHKERRQ(ierr);
174977019fcaSJed Brown     ierr = ISLocalToGlobalMappingDestroy(&cmap);CHKERRQ(ierr);
175077019fcaSJed Brown   }
175177019fcaSJed Brown 
175276bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
17530189643fSJed Brown     for (i=0; i<vs->nr; i++) {
17540189643fSJed Brown       for (j=0; j<vs->nc; j++) {
17550189643fSJed Brown         PetscInt m,n,M,N,mi,ni,Mi,Ni;
17560189643fSJed Brown         Mat      B = vs->m[i][j];
17570189643fSJed Brown         if (!B) continue;
17580189643fSJed Brown         ierr = MatGetSize(B,&M,&N);CHKERRQ(ierr);
17590189643fSJed Brown         ierr = MatGetLocalSize(B,&m,&n);CHKERRQ(ierr);
17600189643fSJed Brown         ierr = ISGetSize(vs->isglobal.row[i],&Mi);CHKERRQ(ierr);
17610189643fSJed Brown         ierr = ISGetSize(vs->isglobal.col[j],&Ni);CHKERRQ(ierr);
17620189643fSJed Brown         ierr = ISGetLocalSize(vs->isglobal.row[i],&mi);CHKERRQ(ierr);
17630189643fSJed Brown         ierr = ISGetLocalSize(vs->isglobal.col[j],&ni);CHKERRQ(ierr);
1764ce94432eSBarry Smith         if (M != Mi || N != Ni) SETERRQ6(PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Global sizes (%D,%D) of nested submatrix (%D,%D) do not agree with space defined by index sets (%D,%D)",M,N,i,j,Mi,Ni);
1765ce94432eSBarry Smith         if (m != mi || n != ni) SETERRQ6(PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Local sizes (%D,%D) of nested submatrix (%D,%D) do not agree with space defined by index sets (%D,%D)",m,n,i,j,mi,ni);
17660189643fSJed Brown       }
17670189643fSJed Brown     }
176876bd3646SJed Brown   }
1769a061e289SJed Brown 
1770a061e289SJed Brown   /* Set A->assembled if all non-null blocks are currently assembled */
1771a061e289SJed Brown   for (i=0; i<vs->nr; i++) {
1772a061e289SJed Brown     for (j=0; j<vs->nc; j++) {
1773a061e289SJed Brown       if (vs->m[i][j] && !vs->m[i][j]->assembled) PetscFunctionReturn(0);
1774a061e289SJed Brown     }
1775a061e289SJed Brown   }
1776a061e289SJed Brown   A->assembled = PETSC_TRUE;
1777d8588912SDave May   PetscFunctionReturn(0);
1778d8588912SDave May }
1779d8588912SDave May 
178045c38901SJed Brown /*@C
1781659c6bb0SJed Brown    MatCreateNest - Creates a new matrix containing several nested submatrices, each stored separately
1782659c6bb0SJed Brown 
1783659c6bb0SJed Brown    Collective on Mat
1784659c6bb0SJed Brown 
1785659c6bb0SJed Brown    Input Parameter:
1786659c6bb0SJed Brown +  comm - Communicator for the new Mat
1787659c6bb0SJed Brown .  nr - number of nested row blocks
17880298fd71SBarry Smith .  is_row - index sets for each nested row block, or NULL to make contiguous
1789659c6bb0SJed Brown .  nc - number of nested column blocks
17900298fd71SBarry Smith .  is_col - index sets for each nested column block, or NULL to make contiguous
17910298fd71SBarry Smith -  a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL
1792659c6bb0SJed Brown 
1793659c6bb0SJed Brown    Output Parameter:
1794659c6bb0SJed Brown .  B - new matrix
1795659c6bb0SJed Brown 
1796659c6bb0SJed Brown    Level: advanced
1797659c6bb0SJed Brown 
179879798668SBarry Smith .seealso: MatCreate(), VecCreateNest(), DMCreateMatrix(), MATNEST, MatNestSetSubMat(),
179979798668SBarry Smith           MatNestGetSubMat(), MatNestGetLocalISs(), MatNestGetSize(),
180079798668SBarry Smith           MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats()
1801659c6bb0SJed Brown @*/
18027087cfbeSBarry Smith PetscErrorCode MatCreateNest(MPI_Comm comm,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[],Mat *B)
1803d8588912SDave May {
1804d8588912SDave May   Mat            A;
1805d8588912SDave May   PetscErrorCode ierr;
1806d8588912SDave May 
1807d8588912SDave May   PetscFunctionBegin;
1808f4259b30SLisandro Dalcin   *B   = NULL;
1809d8588912SDave May   ierr = MatCreate(comm,&A);CHKERRQ(ierr);
1810c8883902SJed Brown   ierr = MatSetType(A,MATNEST);CHKERRQ(ierr);
181191a28eb3SBarry Smith   A->preallocated = PETSC_TRUE;
1812c8883902SJed Brown   ierr = MatNestSetSubMats(A,nr,is_row,nc,is_col,a);CHKERRQ(ierr);
1813d8588912SDave May   *B   = A;
1814d8588912SDave May   PetscFunctionReturn(0);
1815d8588912SDave May }
1816659c6bb0SJed Brown 
1817be705e3aSPierre Jolivet PetscErrorCode MatConvert_Nest_SeqAIJ_fast(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
1818b68353e5Sstefano_zampini {
1819b68353e5Sstefano_zampini   Mat_Nest       *nest = (Mat_Nest*)A->data;
182023875855Sstefano_zampini   Mat            *trans;
1821b68353e5Sstefano_zampini   PetscScalar    **avv;
1822b68353e5Sstefano_zampini   PetscScalar    *vv;
1823b68353e5Sstefano_zampini   PetscInt       **aii,**ajj;
1824b68353e5Sstefano_zampini   PetscInt       *ii,*jj,*ci;
1825b68353e5Sstefano_zampini   PetscInt       nr,nc,nnz,i,j;
1826b68353e5Sstefano_zampini   PetscBool      done;
1827b68353e5Sstefano_zampini   PetscErrorCode ierr;
1828b68353e5Sstefano_zampini 
1829b68353e5Sstefano_zampini   PetscFunctionBegin;
1830b68353e5Sstefano_zampini   ierr = MatGetSize(A,&nr,&nc);CHKERRQ(ierr);
1831b68353e5Sstefano_zampini   if (reuse == MAT_REUSE_MATRIX) {
1832b68353e5Sstefano_zampini     PetscInt rnr;
1833b68353e5Sstefano_zampini 
1834b68353e5Sstefano_zampini     ierr = MatGetRowIJ(*newmat,0,PETSC_FALSE,PETSC_FALSE,&rnr,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr);
1835b68353e5Sstefano_zampini     if (!done) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"MatGetRowIJ");
1836b68353e5Sstefano_zampini     if (rnr != nr) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of rows");
1837b68353e5Sstefano_zampini     ierr = MatSeqAIJGetArray(*newmat,&vv);CHKERRQ(ierr);
1838b68353e5Sstefano_zampini   }
1839b68353e5Sstefano_zampini   /* extract CSR for nested SeqAIJ matrices */
1840b68353e5Sstefano_zampini   nnz  = 0;
184123875855Sstefano_zampini   ierr = PetscCalloc4(nest->nr*nest->nc,&aii,nest->nr*nest->nc,&ajj,nest->nr*nest->nc,&avv,nest->nr*nest->nc,&trans);CHKERRQ(ierr);
1842b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1843b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1844b68353e5Sstefano_zampini       Mat B = nest->m[i][j];
1845b68353e5Sstefano_zampini       if (B) {
1846b68353e5Sstefano_zampini         PetscScalar *naa;
1847b68353e5Sstefano_zampini         PetscInt    *nii,*njj,nnr;
184823875855Sstefano_zampini         PetscBool   istrans;
1849b68353e5Sstefano_zampini 
185023875855Sstefano_zampini         ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans);CHKERRQ(ierr);
185123875855Sstefano_zampini         if (istrans) {
185223875855Sstefano_zampini           Mat Bt;
185323875855Sstefano_zampini 
185423875855Sstefano_zampini           ierr = MatTransposeGetMat(B,&Bt);CHKERRQ(ierr);
185523875855Sstefano_zampini           ierr = MatTranspose(Bt,MAT_INITIAL_MATRIX,&trans[i*nest->nc+j]);CHKERRQ(ierr);
185623875855Sstefano_zampini           B    = trans[i*nest->nc+j];
185723875855Sstefano_zampini         }
1858b68353e5Sstefano_zampini         ierr = MatGetRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&nii,(const PetscInt**)&njj,&done);CHKERRQ(ierr);
1859b68353e5Sstefano_zampini         if (!done) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatGetRowIJ");
1860b68353e5Sstefano_zampini         ierr = MatSeqAIJGetArray(B,&naa);CHKERRQ(ierr);
1861b68353e5Sstefano_zampini         nnz += nii[nnr];
1862b68353e5Sstefano_zampini 
1863b68353e5Sstefano_zampini         aii[i*nest->nc+j] = nii;
1864b68353e5Sstefano_zampini         ajj[i*nest->nc+j] = njj;
1865b68353e5Sstefano_zampini         avv[i*nest->nc+j] = naa;
1866b68353e5Sstefano_zampini       }
1867b68353e5Sstefano_zampini     }
1868b68353e5Sstefano_zampini   }
1869b68353e5Sstefano_zampini   if (reuse != MAT_REUSE_MATRIX) {
1870b68353e5Sstefano_zampini     ierr = PetscMalloc1(nr+1,&ii);CHKERRQ(ierr);
1871b68353e5Sstefano_zampini     ierr = PetscMalloc1(nnz,&jj);CHKERRQ(ierr);
1872b68353e5Sstefano_zampini     ierr = PetscMalloc1(nnz,&vv);CHKERRQ(ierr);
1873b68353e5Sstefano_zampini   } else {
1874b68353e5Sstefano_zampini     if (nnz != ii[nr]) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of nonzeros");
1875b68353e5Sstefano_zampini   }
1876b68353e5Sstefano_zampini 
1877b68353e5Sstefano_zampini   /* new row pointer */
1878580bdb30SBarry Smith   ierr = PetscArrayzero(ii,nr+1);CHKERRQ(ierr);
1879b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1880b68353e5Sstefano_zampini     PetscInt       ncr,rst;
1881b68353e5Sstefano_zampini 
1882b68353e5Sstefano_zampini     ierr = ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL);CHKERRQ(ierr);
1883b68353e5Sstefano_zampini     ierr = ISGetLocalSize(nest->isglobal.row[i],&ncr);CHKERRQ(ierr);
1884b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1885b68353e5Sstefano_zampini       if (aii[i*nest->nc+j]) {
1886b68353e5Sstefano_zampini         PetscInt    *nii = aii[i*nest->nc+j];
1887b68353e5Sstefano_zampini         PetscInt    ir;
1888b68353e5Sstefano_zampini 
1889b68353e5Sstefano_zampini         for (ir=rst; ir<ncr+rst; ++ir) {
1890b68353e5Sstefano_zampini           ii[ir+1] += nii[1]-nii[0];
1891b68353e5Sstefano_zampini           nii++;
1892b68353e5Sstefano_zampini         }
1893b68353e5Sstefano_zampini       }
1894b68353e5Sstefano_zampini     }
1895b68353e5Sstefano_zampini   }
1896b68353e5Sstefano_zampini   for (i=0; i<nr; i++) ii[i+1] += ii[i];
1897b68353e5Sstefano_zampini 
1898b68353e5Sstefano_zampini   /* construct CSR for the new matrix */
1899b68353e5Sstefano_zampini   ierr = PetscCalloc1(nr,&ci);CHKERRQ(ierr);
1900b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1901b68353e5Sstefano_zampini     PetscInt       ncr,rst;
1902b68353e5Sstefano_zampini 
1903b68353e5Sstefano_zampini     ierr = ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL);CHKERRQ(ierr);
1904b68353e5Sstefano_zampini     ierr = ISGetLocalSize(nest->isglobal.row[i],&ncr);CHKERRQ(ierr);
1905b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1906b68353e5Sstefano_zampini       if (aii[i*nest->nc+j]) {
1907b68353e5Sstefano_zampini         PetscScalar *nvv = avv[i*nest->nc+j];
1908b68353e5Sstefano_zampini         PetscInt    *nii = aii[i*nest->nc+j];
1909b68353e5Sstefano_zampini         PetscInt    *njj = ajj[i*nest->nc+j];
1910b68353e5Sstefano_zampini         PetscInt    ir,cst;
1911b68353e5Sstefano_zampini 
1912b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.col[j],&cst,NULL);CHKERRQ(ierr);
1913b68353e5Sstefano_zampini         for (ir=rst; ir<ncr+rst; ++ir) {
1914b68353e5Sstefano_zampini           PetscInt ij,rsize = nii[1]-nii[0],ist = ii[ir]+ci[ir];
1915b68353e5Sstefano_zampini 
1916b68353e5Sstefano_zampini           for (ij=0;ij<rsize;ij++) {
1917b68353e5Sstefano_zampini             jj[ist+ij] = *njj+cst;
1918b68353e5Sstefano_zampini             vv[ist+ij] = *nvv;
1919b68353e5Sstefano_zampini             njj++;
1920b68353e5Sstefano_zampini             nvv++;
1921b68353e5Sstefano_zampini           }
1922b68353e5Sstefano_zampini           ci[ir] += rsize;
1923b68353e5Sstefano_zampini           nii++;
1924b68353e5Sstefano_zampini         }
1925b68353e5Sstefano_zampini       }
1926b68353e5Sstefano_zampini     }
1927b68353e5Sstefano_zampini   }
1928b68353e5Sstefano_zampini   ierr = PetscFree(ci);CHKERRQ(ierr);
1929b68353e5Sstefano_zampini 
1930b68353e5Sstefano_zampini   /* restore info */
1931b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1932b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1933b68353e5Sstefano_zampini       Mat B = nest->m[i][j];
1934b68353e5Sstefano_zampini       if (B) {
1935b68353e5Sstefano_zampini         PetscInt nnr = 0, k = i*nest->nc+j;
193623875855Sstefano_zampini 
193723875855Sstefano_zampini         B    = (trans[k] ? trans[k] : B);
1938b68353e5Sstefano_zampini         ierr = MatRestoreRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&aii[k],(const PetscInt**)&ajj[k],&done);CHKERRQ(ierr);
1939b68353e5Sstefano_zampini         if (!done) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatRestoreRowIJ");
1940b68353e5Sstefano_zampini         ierr = MatSeqAIJRestoreArray(B,&avv[k]);CHKERRQ(ierr);
194123875855Sstefano_zampini         ierr = MatDestroy(&trans[k]);CHKERRQ(ierr);
1942b68353e5Sstefano_zampini       }
1943b68353e5Sstefano_zampini     }
1944b68353e5Sstefano_zampini   }
194523875855Sstefano_zampini   ierr = PetscFree4(aii,ajj,avv,trans);CHKERRQ(ierr);
1946b68353e5Sstefano_zampini 
1947b68353e5Sstefano_zampini   /* finalize newmat */
1948b68353e5Sstefano_zampini   if (reuse == MAT_INITIAL_MATRIX) {
1949b68353e5Sstefano_zampini     ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,newmat);CHKERRQ(ierr);
1950b68353e5Sstefano_zampini   } else if (reuse == MAT_INPLACE_MATRIX) {
1951b68353e5Sstefano_zampini     Mat B;
1952b68353e5Sstefano_zampini 
1953b68353e5Sstefano_zampini     ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,&B);CHKERRQ(ierr);
1954b68353e5Sstefano_zampini     ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr);
1955b68353e5Sstefano_zampini   }
1956b68353e5Sstefano_zampini   ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1957b68353e5Sstefano_zampini   ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1958b68353e5Sstefano_zampini   {
1959b68353e5Sstefano_zampini     Mat_SeqAIJ *a = (Mat_SeqAIJ*)((*newmat)->data);
1960b68353e5Sstefano_zampini     a->free_a     = PETSC_TRUE;
1961b68353e5Sstefano_zampini     a->free_ij    = PETSC_TRUE;
1962b68353e5Sstefano_zampini   }
1963b68353e5Sstefano_zampini   PetscFunctionReturn(0);
1964b68353e5Sstefano_zampini }
1965b68353e5Sstefano_zampini 
1966be705e3aSPierre Jolivet PETSC_INTERN PetscErrorCode MatAXPY_Dense_Nest(Mat Y,PetscScalar a,Mat X)
1967be705e3aSPierre Jolivet {
1968be705e3aSPierre Jolivet   Mat_Nest       *nest = (Mat_Nest*)X->data;
1969be705e3aSPierre Jolivet   PetscInt       i,j,k,rstart;
1970be705e3aSPierre Jolivet   PetscBool      flg;
1971be705e3aSPierre Jolivet   PetscErrorCode ierr;
1972be705e3aSPierre Jolivet 
1973be705e3aSPierre Jolivet   PetscFunctionBegin;
1974be705e3aSPierre Jolivet   /* Fill by row */
1975be705e3aSPierre Jolivet   for (j=0; j<nest->nc; ++j) {
1976be705e3aSPierre Jolivet     /* Using global column indices and ISAllGather() is not scalable. */
1977be705e3aSPierre Jolivet     IS             bNis;
1978be705e3aSPierre Jolivet     PetscInt       bN;
1979be705e3aSPierre Jolivet     const PetscInt *bNindices;
1980be705e3aSPierre Jolivet     ierr = ISAllGather(nest->isglobal.col[j], &bNis);CHKERRQ(ierr);
1981be705e3aSPierre Jolivet     ierr = ISGetSize(bNis,&bN);CHKERRQ(ierr);
1982be705e3aSPierre Jolivet     ierr = ISGetIndices(bNis,&bNindices);CHKERRQ(ierr);
1983be705e3aSPierre Jolivet     for (i=0; i<nest->nr; ++i) {
1984be705e3aSPierre Jolivet       Mat            B,D=NULL;
1985be705e3aSPierre Jolivet       PetscInt       bm, br;
1986be705e3aSPierre Jolivet       const PetscInt *bmindices;
1987be705e3aSPierre Jolivet       B = nest->m[i][j];
1988be705e3aSPierre Jolivet       if (!B) continue;
1989be705e3aSPierre Jolivet       ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&flg);CHKERRQ(ierr);
1990be705e3aSPierre Jolivet       if (flg) {
1991be705e3aSPierre Jolivet         ierr = PetscTryMethod(B,"MatTransposeGetMat_C",(Mat,Mat*),(B,&D));CHKERRQ(ierr);
1992be705e3aSPierre Jolivet         ierr = PetscTryMethod(B,"MatHermitianTransposeGetMat_C",(Mat,Mat*),(B,&D));CHKERRQ(ierr);
1993be705e3aSPierre Jolivet         ierr = MatConvert(B,((PetscObject)D)->type_name,MAT_INITIAL_MATRIX,&D);CHKERRQ(ierr);
1994be705e3aSPierre Jolivet         B = D;
1995be705e3aSPierre Jolivet       }
1996be705e3aSPierre Jolivet       ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQSBAIJ,MATMPISBAIJ,"");CHKERRQ(ierr);
1997be705e3aSPierre Jolivet       if (flg) {
1998be705e3aSPierre Jolivet         if (D) {
1999be705e3aSPierre Jolivet           ierr = MatConvert(D,MATBAIJ,MAT_INPLACE_MATRIX,&D);CHKERRQ(ierr);
2000be705e3aSPierre Jolivet         } else {
2001be705e3aSPierre Jolivet           ierr = MatConvert(B,MATBAIJ,MAT_INITIAL_MATRIX,&D);CHKERRQ(ierr);
2002be705e3aSPierre Jolivet         }
2003be705e3aSPierre Jolivet         B = D;
2004be705e3aSPierre Jolivet       }
2005be705e3aSPierre Jolivet       ierr = ISGetLocalSize(nest->isglobal.row[i],&bm);CHKERRQ(ierr);
2006be705e3aSPierre Jolivet       ierr = ISGetIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2007be705e3aSPierre Jolivet       ierr = MatGetOwnershipRange(B,&rstart,NULL);CHKERRQ(ierr);
2008be705e3aSPierre Jolivet       for (br = 0; br < bm; ++br) {
2009be705e3aSPierre Jolivet         PetscInt          row = bmindices[br], brncols, *cols;
2010be705e3aSPierre Jolivet         const PetscInt    *brcols;
2011be705e3aSPierre Jolivet         const PetscScalar *brcoldata;
2012be705e3aSPierre Jolivet         PetscScalar       *vals = NULL;
2013be705e3aSPierre Jolivet         ierr = MatGetRow(B,br+rstart,&brncols,&brcols,&brcoldata);CHKERRQ(ierr);
2014be705e3aSPierre Jolivet         ierr = PetscMalloc1(brncols,&cols);CHKERRQ(ierr);
2015be705e3aSPierre Jolivet         for (k=0; k<brncols; k++) cols[k] = bNindices[brcols[k]];
2016be705e3aSPierre Jolivet         /*
2017be705e3aSPierre Jolivet           Nest blocks are required to be nonoverlapping -- otherwise nest and monolithic index layouts wouldn't match.
2018be705e3aSPierre Jolivet           Thus, we could use INSERT_VALUES, but I prefer ADD_VALUES.
2019be705e3aSPierre Jolivet          */
2020be705e3aSPierre Jolivet         if (a != 1.0) {
2021be705e3aSPierre Jolivet           ierr = PetscMalloc1(brncols,&vals);CHKERRQ(ierr);
2022be705e3aSPierre Jolivet           for (k=0; k<brncols; k++) vals[k] = a * brcoldata[k];
2023be705e3aSPierre Jolivet           ierr = MatSetValues(Y,1,&row,brncols,cols,vals,ADD_VALUES);CHKERRQ(ierr);
2024be705e3aSPierre Jolivet           ierr = PetscFree(vals);CHKERRQ(ierr);
2025be705e3aSPierre Jolivet         } else {
2026be705e3aSPierre Jolivet           ierr = MatSetValues(Y,1,&row,brncols,cols,brcoldata,ADD_VALUES);CHKERRQ(ierr);
2027be705e3aSPierre Jolivet         }
2028be705e3aSPierre Jolivet         ierr = MatRestoreRow(B,br+rstart,&brncols,&brcols,&brcoldata);CHKERRQ(ierr);
2029be705e3aSPierre Jolivet         ierr = PetscFree(cols);CHKERRQ(ierr);
2030be705e3aSPierre Jolivet       }
2031be705e3aSPierre Jolivet       if (D) {
2032be705e3aSPierre Jolivet         ierr = MatDestroy(&D);
2033be705e3aSPierre Jolivet       }
2034be705e3aSPierre Jolivet       ierr = ISRestoreIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2035be705e3aSPierre Jolivet     }
2036be705e3aSPierre Jolivet     ierr = ISRestoreIndices(bNis,&bNindices);CHKERRQ(ierr);
2037be705e3aSPierre Jolivet     ierr = ISDestroy(&bNis);CHKERRQ(ierr);
2038be705e3aSPierre Jolivet   }
2039be705e3aSPierre Jolivet   ierr = MatAssemblyBegin(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2040be705e3aSPierre Jolivet   ierr = MatAssemblyEnd(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2041be705e3aSPierre Jolivet   PetscFunctionReturn(0);
2042be705e3aSPierre Jolivet }
2043be705e3aSPierre Jolivet 
2044be705e3aSPierre Jolivet PetscErrorCode MatConvert_Nest_AIJ(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
2045629c3df2SDmitry Karpeev {
2046629c3df2SDmitry Karpeev   PetscErrorCode ierr;
2047629c3df2SDmitry Karpeev   Mat_Nest       *nest = (Mat_Nest*)A->data;
2048be705e3aSPierre Jolivet   PetscInt       m,n,M,N,i,j,k,*dnnz,*onnz,rstart,cstart,cend;
2049b68353e5Sstefano_zampini   PetscMPIInt    size;
2050629c3df2SDmitry Karpeev   Mat            C;
2051629c3df2SDmitry Karpeev 
2052629c3df2SDmitry Karpeev   PetscFunctionBegin;
2053ffc4695bSBarry Smith   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&size);CHKERRMPI(ierr);
2054b68353e5Sstefano_zampini   if (size == 1) { /* look for a special case with SeqAIJ matrices and strided-1, contiguous, blocks */
2055b68353e5Sstefano_zampini     PetscInt  nf;
2056b68353e5Sstefano_zampini     PetscBool fast;
2057b68353e5Sstefano_zampini 
2058b68353e5Sstefano_zampini     ierr = PetscStrcmp(newtype,MATAIJ,&fast);CHKERRQ(ierr);
2059b68353e5Sstefano_zampini     if (!fast) {
2060b68353e5Sstefano_zampini       ierr = PetscStrcmp(newtype,MATSEQAIJ,&fast);CHKERRQ(ierr);
2061b68353e5Sstefano_zampini     }
2062b68353e5Sstefano_zampini     for (i=0; i<nest->nr && fast; ++i) {
2063b68353e5Sstefano_zampini       for (j=0; j<nest->nc && fast; ++j) {
2064b68353e5Sstefano_zampini         Mat B = nest->m[i][j];
2065b68353e5Sstefano_zampini         if (B) {
2066b68353e5Sstefano_zampini           ierr = PetscObjectTypeCompare((PetscObject)B,MATSEQAIJ,&fast);CHKERRQ(ierr);
206723875855Sstefano_zampini           if (!fast) {
206823875855Sstefano_zampini             PetscBool istrans;
206923875855Sstefano_zampini 
207023875855Sstefano_zampini             ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans);CHKERRQ(ierr);
207123875855Sstefano_zampini             if (istrans) {
207223875855Sstefano_zampini               Mat Bt;
207323875855Sstefano_zampini 
207423875855Sstefano_zampini               ierr = MatTransposeGetMat(B,&Bt);CHKERRQ(ierr);
207523875855Sstefano_zampini               ierr = PetscObjectTypeCompare((PetscObject)Bt,MATSEQAIJ,&fast);CHKERRQ(ierr);
207623875855Sstefano_zampini             }
2077b68353e5Sstefano_zampini           }
2078b68353e5Sstefano_zampini         }
2079b68353e5Sstefano_zampini       }
2080b68353e5Sstefano_zampini     }
2081b68353e5Sstefano_zampini     for (i=0, nf=0; i<nest->nr && fast; ++i) {
2082b68353e5Sstefano_zampini       ierr = PetscObjectTypeCompare((PetscObject)nest->isglobal.row[i],ISSTRIDE,&fast);CHKERRQ(ierr);
2083b68353e5Sstefano_zampini       if (fast) {
2084b68353e5Sstefano_zampini         PetscInt f,s;
2085b68353e5Sstefano_zampini 
2086b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.row[i],&f,&s);CHKERRQ(ierr);
2087b68353e5Sstefano_zampini         if (f != nf || s != 1) { fast = PETSC_FALSE; }
2088b68353e5Sstefano_zampini         else {
2089b68353e5Sstefano_zampini           ierr = ISGetSize(nest->isglobal.row[i],&f);CHKERRQ(ierr);
2090b68353e5Sstefano_zampini           nf  += f;
2091b68353e5Sstefano_zampini         }
2092b68353e5Sstefano_zampini       }
2093b68353e5Sstefano_zampini     }
2094b68353e5Sstefano_zampini     for (i=0, nf=0; i<nest->nc && fast; ++i) {
2095b68353e5Sstefano_zampini       ierr = PetscObjectTypeCompare((PetscObject)nest->isglobal.col[i],ISSTRIDE,&fast);CHKERRQ(ierr);
2096b68353e5Sstefano_zampini       if (fast) {
2097b68353e5Sstefano_zampini         PetscInt f,s;
2098b68353e5Sstefano_zampini 
2099b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.col[i],&f,&s);CHKERRQ(ierr);
2100b68353e5Sstefano_zampini         if (f != nf || s != 1) { fast = PETSC_FALSE; }
2101b68353e5Sstefano_zampini         else {
2102b68353e5Sstefano_zampini           ierr = ISGetSize(nest->isglobal.col[i],&f);CHKERRQ(ierr);
2103b68353e5Sstefano_zampini           nf  += f;
2104b68353e5Sstefano_zampini         }
2105b68353e5Sstefano_zampini       }
2106b68353e5Sstefano_zampini     }
2107b68353e5Sstefano_zampini     if (fast) {
2108b68353e5Sstefano_zampini       ierr = MatConvert_Nest_SeqAIJ_fast(A,newtype,reuse,newmat);CHKERRQ(ierr);
2109b68353e5Sstefano_zampini       PetscFunctionReturn(0);
2110b68353e5Sstefano_zampini     }
2111b68353e5Sstefano_zampini   }
2112629c3df2SDmitry Karpeev   ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr);
2113629c3df2SDmitry Karpeev   ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr);
2114649b366bSFande Kong   ierr = MatGetOwnershipRangeColumn(A,&cstart,&cend);CHKERRQ(ierr);
2115629c3df2SDmitry Karpeev   switch (reuse) {
2116629c3df2SDmitry Karpeev   case MAT_INITIAL_MATRIX:
2117ce94432eSBarry Smith     ierr    = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr);
2118629c3df2SDmitry Karpeev     ierr    = MatSetType(C,newtype);CHKERRQ(ierr);
2119629c3df2SDmitry Karpeev     ierr    = MatSetSizes(C,m,n,M,N);CHKERRQ(ierr);
2120629c3df2SDmitry Karpeev     *newmat = C;
2121629c3df2SDmitry Karpeev     break;
2122629c3df2SDmitry Karpeev   case MAT_REUSE_MATRIX:
2123629c3df2SDmitry Karpeev     C = *newmat;
2124629c3df2SDmitry Karpeev     break;
2125ce94432eSBarry Smith   default: SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MatReuse");
2126629c3df2SDmitry Karpeev   }
2127785e854fSJed Brown   ierr = PetscMalloc1(2*m,&dnnz);CHKERRQ(ierr);
2128629c3df2SDmitry Karpeev   onnz = dnnz + m;
2129629c3df2SDmitry Karpeev   for (k=0; k<m; k++) {
2130629c3df2SDmitry Karpeev     dnnz[k] = 0;
2131629c3df2SDmitry Karpeev     onnz[k] = 0;
2132629c3df2SDmitry Karpeev   }
2133629c3df2SDmitry Karpeev   for (j=0; j<nest->nc; ++j) {
2134629c3df2SDmitry Karpeev     IS             bNis;
2135629c3df2SDmitry Karpeev     PetscInt       bN;
2136629c3df2SDmitry Karpeev     const PetscInt *bNindices;
2137629c3df2SDmitry Karpeev     /* Using global column indices and ISAllGather() is not scalable. */
2138629c3df2SDmitry Karpeev     ierr = ISAllGather(nest->isglobal.col[j], &bNis);CHKERRQ(ierr);
2139629c3df2SDmitry Karpeev     ierr = ISGetSize(bNis, &bN);CHKERRQ(ierr);
2140629c3df2SDmitry Karpeev     ierr = ISGetIndices(bNis,&bNindices);CHKERRQ(ierr);
2141629c3df2SDmitry Karpeev     for (i=0; i<nest->nr; ++i) {
2142629c3df2SDmitry Karpeev       PetscSF        bmsf;
2143649b366bSFande Kong       PetscSFNode    *iremote;
2144629c3df2SDmitry Karpeev       Mat            B;
2145649b366bSFande Kong       PetscInt       bm, *sub_dnnz,*sub_onnz, br;
2146629c3df2SDmitry Karpeev       const PetscInt *bmindices;
2147629c3df2SDmitry Karpeev       B = nest->m[i][j];
2148629c3df2SDmitry Karpeev       if (!B) continue;
2149629c3df2SDmitry Karpeev       ierr = ISGetLocalSize(nest->isglobal.row[i],&bm);CHKERRQ(ierr);
2150629c3df2SDmitry Karpeev       ierr = ISGetIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2151ce94432eSBarry Smith       ierr = PetscSFCreate(PetscObjectComm((PetscObject)A), &bmsf);CHKERRQ(ierr);
2152649b366bSFande Kong       ierr = PetscMalloc1(bm,&iremote);CHKERRQ(ierr);
2153649b366bSFande Kong       ierr = PetscMalloc1(bm,&sub_dnnz);CHKERRQ(ierr);
2154649b366bSFande Kong       ierr = PetscMalloc1(bm,&sub_onnz);CHKERRQ(ierr);
2155649b366bSFande Kong       for (k = 0; k < bm; ++k){
2156649b366bSFande Kong         sub_dnnz[k] = 0;
2157649b366bSFande Kong         sub_onnz[k] = 0;
2158649b366bSFande Kong       }
2159629c3df2SDmitry Karpeev       /*
2160629c3df2SDmitry Karpeev        Locate the owners for all of the locally-owned global row indices for this row block.
2161629c3df2SDmitry Karpeev        These determine the roots of PetscSF used to communicate preallocation data to row owners.
2162629c3df2SDmitry Karpeev        The roots correspond to the dnnz and onnz entries; thus, there are two roots per row.
2163629c3df2SDmitry Karpeev        */
216483b1a929SMark Adams       ierr = MatGetOwnershipRange(B,&rstart,NULL);CHKERRQ(ierr);
2165629c3df2SDmitry Karpeev       for (br = 0; br < bm; ++br) {
2166131c27b5Sprj-         PetscInt       row = bmindices[br], brncols, col;
2167629c3df2SDmitry Karpeev         const PetscInt *brcols;
2168a4b3d3acSMatthew G Knepley         PetscInt       rowrel = 0; /* row's relative index on its owner rank */
2169131c27b5Sprj-         PetscMPIInt    rowowner = 0;
2170629c3df2SDmitry Karpeev         ierr      = PetscLayoutFindOwnerIndex(A->rmap,row,&rowowner,&rowrel);CHKERRQ(ierr);
2171649b366bSFande Kong         /* how many roots  */
2172649b366bSFande Kong         iremote[br].rank = rowowner; iremote[br].index = rowrel;           /* edge from bmdnnz to dnnz */
2173649b366bSFande Kong         /* get nonzero pattern */
217483b1a929SMark Adams         ierr = MatGetRow(B,br+rstart,&brncols,&brcols,NULL);CHKERRQ(ierr);
2175629c3df2SDmitry Karpeev         for (k=0; k<brncols; k++) {
2176629c3df2SDmitry Karpeev           col  = bNindices[brcols[k]];
2177649b366bSFande Kong           if (col>=A->cmap->range[rowowner] && col<A->cmap->range[rowowner+1]) {
2178649b366bSFande Kong             sub_dnnz[br]++;
2179649b366bSFande Kong           } else {
2180649b366bSFande Kong             sub_onnz[br]++;
2181649b366bSFande Kong           }
2182629c3df2SDmitry Karpeev         }
218383b1a929SMark Adams         ierr = MatRestoreRow(B,br+rstart,&brncols,&brcols,NULL);CHKERRQ(ierr);
2184629c3df2SDmitry Karpeev       }
2185629c3df2SDmitry Karpeev       ierr = ISRestoreIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
2186629c3df2SDmitry Karpeev       /* bsf will have to take care of disposing of bedges. */
2187649b366bSFande Kong       ierr = PetscSFSetGraph(bmsf,m,bm,NULL,PETSC_OWN_POINTER,iremote,PETSC_OWN_POINTER);CHKERRQ(ierr);
2188649b366bSFande Kong       ierr = PetscSFReduceBegin(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM);CHKERRQ(ierr);
2189649b366bSFande Kong       ierr = PetscSFReduceEnd(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM);CHKERRQ(ierr);
2190649b366bSFande Kong       ierr = PetscSFReduceBegin(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM);CHKERRQ(ierr);
2191649b366bSFande Kong       ierr = PetscSFReduceEnd(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM);CHKERRQ(ierr);
2192649b366bSFande Kong       ierr = PetscFree(sub_dnnz);CHKERRQ(ierr);
2193649b366bSFande Kong       ierr = PetscFree(sub_onnz);CHKERRQ(ierr);
2194629c3df2SDmitry Karpeev       ierr = PetscSFDestroy(&bmsf);CHKERRQ(ierr);
2195629c3df2SDmitry Karpeev     }
219622d28d08SBarry Smith     ierr = ISRestoreIndices(bNis,&bNindices);CHKERRQ(ierr);
2197629c3df2SDmitry Karpeev     ierr = ISDestroy(&bNis);CHKERRQ(ierr);
219865a4a0a3Sstefano_zampini   }
219965a4a0a3Sstefano_zampini   /* Resize preallocation if overestimated */
220065a4a0a3Sstefano_zampini   for (i=0;i<m;i++) {
220165a4a0a3Sstefano_zampini     dnnz[i] = PetscMin(dnnz[i],A->cmap->n);
220265a4a0a3Sstefano_zampini     onnz[i] = PetscMin(onnz[i],A->cmap->N - A->cmap->n);
2203629c3df2SDmitry Karpeev   }
2204629c3df2SDmitry Karpeev   ierr = MatSeqAIJSetPreallocation(C,0,dnnz);CHKERRQ(ierr);
2205629c3df2SDmitry Karpeev   ierr = MatMPIAIJSetPreallocation(C,0,dnnz,0,onnz);CHKERRQ(ierr);
2206629c3df2SDmitry Karpeev   ierr = PetscFree(dnnz);CHKERRQ(ierr);
2207be705e3aSPierre Jolivet   ierr = MatAXPY_Dense_Nest(C,1.0,A);CHKERRQ(ierr);
2208be705e3aSPierre Jolivet   PetscFunctionReturn(0);
2209be705e3aSPierre Jolivet }
2210629c3df2SDmitry Karpeev 
2211be705e3aSPierre Jolivet PetscErrorCode MatConvert_Nest_Dense(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
2212be705e3aSPierre Jolivet {
2213629c3df2SDmitry Karpeev   Mat            B;
2214be705e3aSPierre Jolivet   PetscInt       m,n,M,N;
2215be705e3aSPierre Jolivet   PetscErrorCode ierr;
2216be705e3aSPierre Jolivet 
2217be705e3aSPierre Jolivet   PetscFunctionBegin;
2218be705e3aSPierre Jolivet   ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr);
2219be705e3aSPierre Jolivet   ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr);
2220be705e3aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
2221be705e3aSPierre Jolivet     B = *newmat;
2222be705e3aSPierre Jolivet     ierr = MatZeroEntries(B);CHKERRQ(ierr);
2223be705e3aSPierre Jolivet   } else {
2224be705e3aSPierre Jolivet     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),m,PETSC_DECIDE,M,N,NULL,&B);CHKERRQ(ierr);
2225629c3df2SDmitry Karpeev   }
2226be705e3aSPierre Jolivet   ierr = MatAXPY_Dense_Nest(B,1.0,A);CHKERRQ(ierr);
2227be705e3aSPierre Jolivet   if (reuse == MAT_INPLACE_MATRIX) {
2228be705e3aSPierre Jolivet     ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr);
2229be705e3aSPierre Jolivet   } else if (reuse == MAT_INITIAL_MATRIX) *newmat = B;
2230629c3df2SDmitry Karpeev   PetscFunctionReturn(0);
2231629c3df2SDmitry Karpeev }
2232629c3df2SDmitry Karpeev 
22338b7d3b4bSBarry Smith PetscErrorCode MatHasOperation_Nest(Mat mat,MatOperation op,PetscBool *has)
22348b7d3b4bSBarry Smith {
22358b7d3b4bSBarry Smith   Mat_Nest       *bA = (Mat_Nest*)mat->data;
22363c6db4c4SPierre Jolivet   MatOperation   opAdd;
22378b7d3b4bSBarry Smith   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
22388b7d3b4bSBarry Smith   PetscBool      flg;
223952c5f739Sprj-   PetscErrorCode ierr;
224052c5f739Sprj-   PetscFunctionBegin;
22418b7d3b4bSBarry Smith 
224252c5f739Sprj-   *has = PETSC_FALSE;
22433c6db4c4SPierre Jolivet   if (op == MATOP_MULT || op == MATOP_MULT_ADD || op == MATOP_MULT_TRANSPOSE || op == MATOP_MULT_TRANSPOSE_ADD) {
22443c6db4c4SPierre Jolivet     opAdd = (op == MATOP_MULT || op == MATOP_MULT_ADD ? MATOP_MULT_ADD : MATOP_MULT_TRANSPOSE_ADD);
22458b7d3b4bSBarry Smith     for (j=0; j<nc; j++) {
22468b7d3b4bSBarry Smith       for (i=0; i<nr; i++) {
22478b7d3b4bSBarry Smith         if (!bA->m[i][j]) continue;
22483c6db4c4SPierre Jolivet         ierr = MatHasOperation(bA->m[i][j],opAdd,&flg);CHKERRQ(ierr);
22498b7d3b4bSBarry Smith         if (!flg) PetscFunctionReturn(0);
22508b7d3b4bSBarry Smith       }
22518b7d3b4bSBarry Smith     }
22528b7d3b4bSBarry Smith   }
22533c6db4c4SPierre Jolivet   if (((void**)mat->ops)[op]) *has = PETSC_TRUE;
22548b7d3b4bSBarry Smith   PetscFunctionReturn(0);
22558b7d3b4bSBarry Smith }
22568b7d3b4bSBarry Smith 
/*MC
  MATNEST - MATNEST = "nest" - Matrix type consisting of nested submatrices, each stored separately.

  Level: intermediate

  Notes:
  This matrix type permits scalable use of PCFieldSplit and avoids the large memory costs of extracting submatrices.
  It allows the use of symmetric and block formats for parts of multi-physics simulations.
  It is usually used with DMComposite and DMCreateMatrix().

  Each of the submatrices lives on the same MPI communicator as the original nest matrix (though they can have zero
  rows/columns on some processes). Thus this is not meant for cases where the submatrices live on far fewer processes
  than the nest matrix.

.seealso: MatCreate(), MatType, MatCreateNest(), MatNestSetSubMat(), MatNestGetSubMat(),
          VecCreateNest(), DMCreateMatrix(), DMCOMPOSITE, MatNestSetVecType(), MatNestGetLocalISs(),
          MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats()
M*/
22758cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_Nest(Mat A)
2276c8883902SJed Brown {
2277c8883902SJed Brown   Mat_Nest       *s;
2278c8883902SJed Brown   PetscErrorCode ierr;
2279c8883902SJed Brown 
2280c8883902SJed Brown   PetscFunctionBegin;
2281b00a9115SJed Brown   ierr    = PetscNewLog(A,&s);CHKERRQ(ierr);
2282c8883902SJed Brown   A->data = (void*)s;
2283e7c19651SJed Brown 
2284e7c19651SJed Brown   s->nr            = -1;
2285e7c19651SJed Brown   s->nc            = -1;
22860298fd71SBarry Smith   s->m             = NULL;
2287e7c19651SJed Brown   s->splitassembly = PETSC_FALSE;
2288c8883902SJed Brown 
2289c8883902SJed Brown   ierr = PetscMemzero(A->ops,sizeof(*A->ops));CHKERRQ(ierr);
229026fbe8dcSKarl Rupp 
2291c8883902SJed Brown   A->ops->mult                  = MatMult_Nest;
22929194d70fSJed Brown   A->ops->multadd               = MatMultAdd_Nest;
2293c8883902SJed Brown   A->ops->multtranspose         = MatMultTranspose_Nest;
22949194d70fSJed Brown   A->ops->multtransposeadd      = MatMultTransposeAdd_Nest;
2295f8170845SAlex Fikl   A->ops->transpose             = MatTranspose_Nest;
2296c8883902SJed Brown   A->ops->assemblybegin         = MatAssemblyBegin_Nest;
2297c8883902SJed Brown   A->ops->assemblyend           = MatAssemblyEnd_Nest;
2298c8883902SJed Brown   A->ops->zeroentries           = MatZeroEntries_Nest;
2299c222c20dSDavid Ham   A->ops->copy                  = MatCopy_Nest;
23006e76ffeaSPierre Jolivet   A->ops->axpy                  = MatAXPY_Nest;
2301c8883902SJed Brown   A->ops->duplicate             = MatDuplicate_Nest;
23027dae84e0SHong Zhang   A->ops->createsubmatrix       = MatCreateSubMatrix_Nest;
2303c8883902SJed Brown   A->ops->destroy               = MatDestroy_Nest;
2304c8883902SJed Brown   A->ops->view                  = MatView_Nest;
2305f4259b30SLisandro Dalcin   A->ops->getvecs               = NULL; /* Use VECNEST by calling MatNestSetVecType(A,VECNEST) */
2306c8883902SJed Brown   A->ops->getlocalsubmatrix     = MatGetLocalSubMatrix_Nest;
2307c8883902SJed Brown   A->ops->restorelocalsubmatrix = MatRestoreLocalSubMatrix_Nest;
2308429bac76SJed Brown   A->ops->getdiagonal           = MatGetDiagonal_Nest;
2309429bac76SJed Brown   A->ops->diagonalscale         = MatDiagonalScale_Nest;
2310a061e289SJed Brown   A->ops->scale                 = MatScale_Nest;
2311a061e289SJed Brown   A->ops->shift                 = MatShift_Nest;
231213135bc6SAlex Fikl   A->ops->diagonalset           = MatDiagonalSet_Nest;
2313f8170845SAlex Fikl   A->ops->setrandom             = MatSetRandom_Nest;
23148b7d3b4bSBarry Smith   A->ops->hasoperation          = MatHasOperation_Nest;
2315381b8e50SStefano Zampini   A->ops->missingdiagonal       = MatMissingDiagonal_Nest;
2316c8883902SJed Brown 
2317f4259b30SLisandro Dalcin   A->spptr        = NULL;
2318c8883902SJed Brown   A->assembled    = PETSC_FALSE;
2319c8883902SJed Brown 
2320c8883902SJed Brown   /* expose Nest api's */
2321bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",        MatNestGetSubMat_Nest);CHKERRQ(ierr);
2322bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",        MatNestSetSubMat_Nest);CHKERRQ(ierr);
2323bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",       MatNestGetSubMats_Nest);CHKERRQ(ierr);
2324bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",          MatNestGetSize_Nest);CHKERRQ(ierr);
2325bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",           MatNestGetISs_Nest);CHKERRQ(ierr);
2326bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",      MatNestGetLocalISs_Nest);CHKERRQ(ierr);
2327bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",       MatNestSetVecType_Nest);CHKERRQ(ierr);
2328bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",       MatNestSetSubMats_Nest);CHKERRQ(ierr);
23290899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",  MatConvert_Nest_AIJ);CHKERRQ(ierr);
23300899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",  MatConvert_Nest_AIJ);CHKERRQ(ierr);
233183b1a929SMark Adams   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",     MatConvert_Nest_AIJ);CHKERRQ(ierr);
23325e3038f0Sstefano_zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",      MatConvert_Nest_IS);CHKERRQ(ierr);
2333be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpidense_C",MatConvert_Nest_Dense);CHKERRQ(ierr);
2334be705e3aSPierre Jolivet   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqdense_C",MatConvert_Nest_Dense);CHKERRQ(ierr);
23354222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_seqdense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr);
23364222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_mpidense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr);
23374222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_dense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr);
2338c8883902SJed Brown 
2339c8883902SJed Brown   ierr = PetscObjectChangeTypeName((PetscObject)A,MATNEST);CHKERRQ(ierr);
2340c8883902SJed Brown   PetscFunctionReturn(0);
2341c8883902SJed Brown }
2342