xref: /petsc/src/mat/impls/nest/matnest.c (revision 79798668b58fd54383718865ba3bcf39bec27d06)
1aaa7dc30SBarry Smith #include <../src/mat/impls/nest/matnestimpl.h> /*I   "petscmat.h"   I*/
2b68353e5Sstefano_zampini #include <../src/mat/impls/aij/seq/aij.h>
30c312b8eSJed Brown #include <petscsf.h>
4d8588912SDave May 
5c8883902SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat,PetscInt,const IS[],PetscInt,const IS[]);
62a7a6963SBarry Smith static PetscErrorCode MatCreateVecs_Nest(Mat A,Vec *right,Vec *left);
75e3038f0Sstefano_zampini PETSC_INTERN PetscErrorCode MatConvert_Nest_IS(Mat,MatType,MatReuse,Mat*);
8c8883902SJed Brown 
9d8588912SDave May /* private functions */
108188e55aSJed Brown static PetscErrorCode MatNestGetSizes_Private(Mat A,PetscInt *m,PetscInt *n,PetscInt *M,PetscInt *N)
11d8588912SDave May {
12d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
138188e55aSJed Brown   PetscInt       i,j;
14d8588912SDave May   PetscErrorCode ierr;
15d8588912SDave May 
16d8588912SDave May   PetscFunctionBegin;
178188e55aSJed Brown   *m = *n = *M = *N = 0;
188188e55aSJed Brown   for (i=0; i<bA->nr; i++) {  /* rows */
198188e55aSJed Brown     PetscInt sm,sM;
208188e55aSJed Brown     ierr = ISGetLocalSize(bA->isglobal.row[i],&sm);CHKERRQ(ierr);
218188e55aSJed Brown     ierr = ISGetSize(bA->isglobal.row[i],&sM);CHKERRQ(ierr);
228188e55aSJed Brown     *m  += sm;
238188e55aSJed Brown     *M  += sM;
24d8588912SDave May   }
258188e55aSJed Brown   for (j=0; j<bA->nc; j++) {  /* cols */
268188e55aSJed Brown     PetscInt sn,sN;
278188e55aSJed Brown     ierr = ISGetLocalSize(bA->isglobal.col[j],&sn);CHKERRQ(ierr);
288188e55aSJed Brown     ierr = ISGetSize(bA->isglobal.col[j],&sN);CHKERRQ(ierr);
298188e55aSJed Brown     *n  += sn;
308188e55aSJed Brown     *N  += sN;
31d8588912SDave May   }
32d8588912SDave May   PetscFunctionReturn(0);
33d8588912SDave May }
34d8588912SDave May 
35d8588912SDave May /* operations */
36207556f9SJed Brown static PetscErrorCode MatMult_Nest(Mat A,Vec x,Vec y)
37d8588912SDave May {
38d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
39207556f9SJed Brown   Vec            *bx = bA->right,*by = bA->left;
40207556f9SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
41d8588912SDave May   PetscErrorCode ierr;
42d8588912SDave May 
43d8588912SDave May   PetscFunctionBegin;
44207556f9SJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(y,bA->isglobal.row[i],&by[i]);CHKERRQ(ierr);}
45207556f9SJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
46207556f9SJed Brown   for (i=0; i<nr; i++) {
47d8588912SDave May     ierr = VecZeroEntries(by[i]);CHKERRQ(ierr);
48207556f9SJed Brown     for (j=0; j<nc; j++) {
49207556f9SJed Brown       if (!bA->m[i][j]) continue;
50d8588912SDave May       /* y[i] <- y[i] + A[i][j] * x[j] */
51d8588912SDave May       ierr = MatMultAdd(bA->m[i][j],bx[j],by[i],by[i]);CHKERRQ(ierr);
52d8588912SDave May     }
53d8588912SDave May   }
54207556f9SJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(y,bA->isglobal.row[i],&by[i]);CHKERRQ(ierr);}
55207556f9SJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
56d8588912SDave May   PetscFunctionReturn(0);
57d8588912SDave May }
58d8588912SDave May 
599194d70fSJed Brown static PetscErrorCode MatMultAdd_Nest(Mat A,Vec x,Vec y,Vec z)
609194d70fSJed Brown {
619194d70fSJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
629194d70fSJed Brown   Vec            *bx = bA->right,*bz = bA->left;
639194d70fSJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
649194d70fSJed Brown   PetscErrorCode ierr;
659194d70fSJed Brown 
669194d70fSJed Brown   PetscFunctionBegin;
679194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(z,bA->isglobal.row[i],&bz[i]);CHKERRQ(ierr);}
689194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
699194d70fSJed Brown   for (i=0; i<nr; i++) {
709194d70fSJed Brown     if (y != z) {
719194d70fSJed Brown       Vec by;
729194d70fSJed Brown       ierr = VecGetSubVector(y,bA->isglobal.row[i],&by);CHKERRQ(ierr);
739194d70fSJed Brown       ierr = VecCopy(by,bz[i]);CHKERRQ(ierr);
74336d21e7SJed Brown       ierr = VecRestoreSubVector(y,bA->isglobal.row[i],&by);CHKERRQ(ierr);
759194d70fSJed Brown     }
769194d70fSJed Brown     for (j=0; j<nc; j++) {
779194d70fSJed Brown       if (!bA->m[i][j]) continue;
789194d70fSJed Brown       /* y[i] <- y[i] + A[i][j] * x[j] */
799194d70fSJed Brown       ierr = MatMultAdd(bA->m[i][j],bx[j],bz[i],bz[i]);CHKERRQ(ierr);
809194d70fSJed Brown     }
819194d70fSJed Brown   }
829194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(z,bA->isglobal.row[i],&bz[i]);CHKERRQ(ierr);}
839194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);}
849194d70fSJed Brown   PetscFunctionReturn(0);
859194d70fSJed Brown }
869194d70fSJed Brown 
8752c5f739Sprj- typedef struct {
8852c5f739Sprj-   Mat          *workC;    /* array of Mat with specific containers depending on the underlying MatMatMult implementation */
8952c5f739Sprj-   PetscScalar  *tarray;   /* buffer for storing all temporary products A[i][j] B[j] */
9052c5f739Sprj-   PetscInt     *dm,*dn,k; /* displacements and number of submatrices */
9152c5f739Sprj- } Nest_Dense;
9252c5f739Sprj- 
9352c5f739Sprj- PETSC_INTERN PetscErrorCode MatMatMultNumeric_Nest_Dense(Mat A,Mat B,Mat C)
9452c5f739Sprj- {
9552c5f739Sprj-   Mat_Nest          *bA = (Mat_Nest*)A->data;
9652c5f739Sprj-   PetscContainer    container;
9752c5f739Sprj-   Nest_Dense        *contents;
9852c5f739Sprj-   Mat               viewB,viewC,seq;
9952c5f739Sprj-   const PetscScalar *barray;
10052c5f739Sprj-   PetscScalar       *carray;
10152c5f739Sprj-   PetscInt          i,j,M,N,nr = bA->nr,nc = bA->nc,ldb,ldc;
10252c5f739Sprj-   PetscErrorCode    ierr;
10352c5f739Sprj- 
10452c5f739Sprj-   PetscFunctionBegin;
10552c5f739Sprj-   ierr = PetscObjectQuery((PetscObject)C,"workC",(PetscObject*)&container);CHKERRQ(ierr);
10652c5f739Sprj-   if (!container) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Container does not exist");
10752c5f739Sprj-   ierr = PetscContainerGetPointer(container,(void**)&contents);CHKERRQ(ierr);
10852c5f739Sprj-   ierr = MatDenseGetLDA(B,&ldb);CHKERRQ(ierr);
10952c5f739Sprj-   ierr = MatDenseGetLDA(C,&ldc);CHKERRQ(ierr);
11052c5f739Sprj-   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
11152c5f739Sprj-   ierr = MatZeroEntries(C);CHKERRQ(ierr);
11252c5f739Sprj-   ierr = MatDenseGetArrayRead(B,&barray);CHKERRQ(ierr);
11352c5f739Sprj-   ierr = MatDenseGetArray(C,&carray);CHKERRQ(ierr);
11452c5f739Sprj-   for (i=0; i<nr; i++) {
11552c5f739Sprj-     ierr = ISGetSize(bA->isglobal.row[i],&M);CHKERRQ(ierr);
11652c5f739Sprj-     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dm[i+1]-contents->dm[i],PETSC_DECIDE,M,N,carray+contents->dm[i],&viewC);CHKERRQ(ierr);
11752c5f739Sprj-     ierr = MatDenseGetLocalMatrix(viewC,&seq);CHKERRQ(ierr);
11852c5f739Sprj-     ierr = MatSeqDenseSetLDA(seq,ldc);CHKERRQ(ierr);
11952c5f739Sprj-     for (j=0; j<nc; j++) {
12052c5f739Sprj-       if (!bA->m[i][j]) continue;
12152c5f739Sprj-       ierr = ISGetSize(bA->isglobal.col[j],&M);CHKERRQ(ierr);
12252c5f739Sprj-       ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB);CHKERRQ(ierr);
12352c5f739Sprj-       ierr = MatDenseGetLocalMatrix(viewB,&seq);CHKERRQ(ierr);
12452c5f739Sprj-       ierr = MatSeqDenseSetLDA(seq,ldb);CHKERRQ(ierr);
12552c5f739Sprj-       /* workC <- A[i][j] * B[j] */
12652c5f739Sprj-       ierr = MatMatMultNumeric(bA->m[i][j],viewB,contents->workC[i*nc + j]);CHKERRQ(ierr);
12752c5f739Sprj-       ierr = MatDestroy(&viewB);CHKERRQ(ierr);
12852c5f739Sprj-        /* C[i] <- workC + C[i] */
12952c5f739Sprj-       ierr = MatAXPY(viewC,1.0,contents->workC[i*nc + j],SAME_NONZERO_PATTERN);CHKERRQ(ierr);
13052c5f739Sprj-     }
13152c5f739Sprj-     ierr = MatDestroy(&viewC);CHKERRQ(ierr);
13252c5f739Sprj-   }
13352c5f739Sprj-   ierr = MatDenseRestoreArray(C,&carray);CHKERRQ(ierr);
13452c5f739Sprj-   ierr = MatDenseRestoreArrayRead(B,&barray);CHKERRQ(ierr);
13552c5f739Sprj-   PetscFunctionReturn(0);
13652c5f739Sprj- }
13752c5f739Sprj- 
13852c5f739Sprj- PetscErrorCode MatNest_DenseDestroy(void *ctx)
13952c5f739Sprj- {
14052c5f739Sprj-   Nest_Dense     *contents = (Nest_Dense*)ctx;
14152c5f739Sprj-   PetscInt       i;
14252c5f739Sprj-   PetscErrorCode ierr;
14352c5f739Sprj- 
14452c5f739Sprj-   PetscFunctionBegin;
14552c5f739Sprj-   ierr = PetscFree(contents->tarray);CHKERRQ(ierr);
14652c5f739Sprj-   for (i=0; i<contents->k; i++) {
14752c5f739Sprj-     ierr = MatDestroy(contents->workC + i);CHKERRQ(ierr);
14852c5f739Sprj-   }
14952c5f739Sprj-   ierr = PetscFree3(contents->dm,contents->dn,contents->workC);CHKERRQ(ierr);
15052c5f739Sprj-   ierr = PetscFree(contents);CHKERRQ(ierr);
15152c5f739Sprj-   PetscFunctionReturn(0);
15252c5f739Sprj- }
15352c5f739Sprj- 
15452c5f739Sprj- PETSC_INTERN PetscErrorCode MatMatMultSymbolic_Nest_Dense(Mat A,Mat B,PetscReal fill,Mat *C)
15552c5f739Sprj- {
15652c5f739Sprj-   Mat_Nest          *bA = (Mat_Nest*)A->data;
15752c5f739Sprj-   Mat               viewB,viewSeq;
15852c5f739Sprj-   const PetscScalar *barray;
15952c5f739Sprj-   PetscInt          i,j,M,N,m,nr = bA->nr,nc = bA->nc,maxm = 0,ldb;
16052c5f739Sprj-   PetscContainer    container;
16152c5f739Sprj-   Nest_Dense        *contents;
16252c5f739Sprj-   PetscErrorCode    ierr;
16352c5f739Sprj- 
16452c5f739Sprj-   PetscFunctionBegin;
16552c5f739Sprj-   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
16652c5f739Sprj-   if (!(*C)) {
16752c5f739Sprj-     ierr = MatGetLocalSize(A,&m,NULL);CHKERRQ(ierr);
16852c5f739Sprj-     ierr = MatGetSize(A,&M,NULL);CHKERRQ(ierr);
16952c5f739Sprj-     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),m,PETSC_DECIDE,M,N,NULL,C);CHKERRQ(ierr);
17052c5f739Sprj-   } else {
17152c5f739Sprj-     if ((*C)->rmap->n != A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Matrix local row dimensions are incompatible, %D != %D",(*C)->rmap->n,A->rmap->n);
17252c5f739Sprj-     if ((*C)->cmap->n != B->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Matrix local column dimensions are incompatible, %D != %D",(*C)->cmap->n,B->cmap->n);
17352c5f739Sprj-   }
17452c5f739Sprj- 
17552c5f739Sprj-   ierr = PetscNew(&contents);CHKERRQ(ierr);
17652c5f739Sprj-   ierr = PetscContainerCreate(PetscObjectComm((PetscObject)A),&container);CHKERRQ(ierr);
17752c5f739Sprj-   ierr = PetscContainerSetPointer(container,contents);CHKERRQ(ierr);
17852c5f739Sprj-   ierr = PetscContainerSetUserDestroy(container,MatNest_DenseDestroy);CHKERRQ(ierr);
17952c5f739Sprj-   ierr = PetscObjectCompose((PetscObject)*C,"workC",(PetscObject)container);CHKERRQ(ierr);
18052c5f739Sprj-   ierr = PetscContainerDestroy(&container);CHKERRQ(ierr);
18152c5f739Sprj-   ierr = PetscCalloc3(nr+1,&contents->dm,nc+1,&contents->dn,nr*nc,&contents->workC);CHKERRQ(ierr);
18252c5f739Sprj-   contents->k = nr*nc;
18352c5f739Sprj-   for (i=0; i<nr; i++) {
18452c5f739Sprj-     ierr = ISGetLocalSize(bA->isglobal.row[i],contents->dm + i+1);CHKERRQ(ierr);
18552c5f739Sprj-     maxm = PetscMax(maxm,contents->dm[i+1]);
18652c5f739Sprj-     contents->dm[i+1] += contents->dm[i];
18752c5f739Sprj-   }
18852c5f739Sprj-   for (i=0; i<nc; i++) {
18952c5f739Sprj-     ierr = ISGetLocalSize(bA->isglobal.col[i],contents->dn + i+1);CHKERRQ(ierr);
19052c5f739Sprj-     contents->dn[i+1] += contents->dn[i];
19152c5f739Sprj-   }
19252c5f739Sprj-   ierr = PetscMalloc1(maxm*N,&contents->tarray);CHKERRQ(ierr);
19352c5f739Sprj-   ierr = MatDenseGetLDA(B,&ldb);CHKERRQ(ierr);
19452c5f739Sprj-   ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr);
19552c5f739Sprj-   ierr = MatDenseGetArrayRead(B,&barray);CHKERRQ(ierr);
19652c5f739Sprj-   /* loops are permuted compared to MatMatMultNumeric so that viewB is created only once per column of A */
19752c5f739Sprj-   for (j=0; j<nc; j++) {
19852c5f739Sprj-     ierr = ISGetSize(bA->isglobal.col[j],&M);CHKERRQ(ierr);
19952c5f739Sprj-     ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB);CHKERRQ(ierr);
20052c5f739Sprj-     ierr = MatDenseGetLocalMatrix(viewB,&viewSeq);CHKERRQ(ierr);
20152c5f739Sprj-     ierr = MatSeqDenseSetLDA(viewSeq,ldb);CHKERRQ(ierr);
20252c5f739Sprj-     for (i=0; i<nr; i++) {
20352c5f739Sprj-       if (!bA->m[i][j]) continue;
20452c5f739Sprj-       /* MatMatMultSymbolic may attach a specific container (depending on MatType of bA->m[i][j]) to workC[i][j] */
20552c5f739Sprj-       ierr = MatMatMultSymbolic(bA->m[i][j],viewB,fill,contents->workC + i*nc + j);CHKERRQ(ierr);
20652c5f739Sprj-       ierr = MatDenseGetLocalMatrix(contents->workC[i*nc + j],&viewSeq);CHKERRQ(ierr);
20752c5f739Sprj-       /* free the memory allocated in MatMatMultSymbolic, since tarray will be shared by all Mat */
20852c5f739Sprj-       ierr = MatSeqDenseSetPreallocation(viewSeq,contents->tarray);CHKERRQ(ierr);
20952c5f739Sprj-     }
21052c5f739Sprj-     ierr = MatDestroy(&viewB);CHKERRQ(ierr);
21152c5f739Sprj-   }
21252c5f739Sprj-   ierr = MatDenseRestoreArrayRead(B,&barray);CHKERRQ(ierr);
21352c5f739Sprj- 
21452c5f739Sprj-   (*C)->ops->matmultnumeric = MatMatMultNumeric_Nest_Dense;
21552c5f739Sprj-   PetscFunctionReturn(0);
21652c5f739Sprj- }
21752c5f739Sprj- 
21852c5f739Sprj- PETSC_INTERN PetscErrorCode MatMatMult_Nest_Dense(Mat A,Mat B,MatReuse scall,PetscReal fill,Mat *C)
21952c5f739Sprj- {
22052c5f739Sprj-   PetscErrorCode ierr;
22152c5f739Sprj- 
22252c5f739Sprj-   PetscFunctionBegin;
22352c5f739Sprj-   if (scall == MAT_INITIAL_MATRIX) {
22452c5f739Sprj-     *C = NULL;
22552c5f739Sprj-     ierr = PetscLogEventBegin(MAT_MatMultSymbolic,A,B,0,0);CHKERRQ(ierr);
22652c5f739Sprj-     ierr = MatMatMultSymbolic_Nest_Dense(A,B,fill,C);CHKERRQ(ierr);
22752c5f739Sprj-     ierr = PetscLogEventEnd(MAT_MatMultSymbolic,A,B,0,0);CHKERRQ(ierr);
22852c5f739Sprj-   }
22952c5f739Sprj-   ierr = PetscLogEventBegin(MAT_MatMultNumeric,A,B,0,0);CHKERRQ(ierr);
23052c5f739Sprj-   ierr = MatMatMultNumeric_Nest_Dense(A,B,*C);CHKERRQ(ierr);
23152c5f739Sprj-   ierr = PetscLogEventEnd(MAT_MatMultNumeric,A,B,0,0);CHKERRQ(ierr);
23252c5f739Sprj-   PetscFunctionReturn(0);
23352c5f739Sprj- }
23452c5f739Sprj- 
235207556f9SJed Brown static PetscErrorCode MatMultTranspose_Nest(Mat A,Vec x,Vec y)
236d8588912SDave May {
237d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
238207556f9SJed Brown   Vec            *bx = bA->left,*by = bA->right;
239207556f9SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
240d8588912SDave May   PetscErrorCode ierr;
241d8588912SDave May 
242d8588912SDave May   PetscFunctionBegin;
243609e31cbSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
244609e31cbSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(y,bA->isglobal.col[i],&by[i]);CHKERRQ(ierr);}
245207556f9SJed Brown   for (j=0; j<nc; j++) {
246609e31cbSJed Brown     ierr = VecZeroEntries(by[j]);CHKERRQ(ierr);
247609e31cbSJed Brown     for (i=0; i<nr; i++) {
2486c75ac25SJed Brown       if (!bA->m[i][j]) continue;
249609e31cbSJed Brown       /* y[j] <- y[j] + (A[i][j])^T * x[i] */
250609e31cbSJed Brown       ierr = MatMultTransposeAdd(bA->m[i][j],bx[i],by[j],by[j]);CHKERRQ(ierr);
251d8588912SDave May     }
252d8588912SDave May   }
253609e31cbSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
254609e31cbSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(y,bA->isglobal.col[i],&by[i]);CHKERRQ(ierr);}
255d8588912SDave May   PetscFunctionReturn(0);
256d8588912SDave May }
257d8588912SDave May 
2589194d70fSJed Brown static PetscErrorCode MatMultTransposeAdd_Nest(Mat A,Vec x,Vec y,Vec z)
2599194d70fSJed Brown {
2609194d70fSJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
2619194d70fSJed Brown   Vec            *bx = bA->left,*bz = bA->right;
2629194d70fSJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
2639194d70fSJed Brown   PetscErrorCode ierr;
2649194d70fSJed Brown 
2659194d70fSJed Brown   PetscFunctionBegin;
2669194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecGetSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
2679194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecGetSubVector(z,bA->isglobal.col[i],&bz[i]);CHKERRQ(ierr);}
2689194d70fSJed Brown   for (j=0; j<nc; j++) {
2699194d70fSJed Brown     if (y != z) {
2709194d70fSJed Brown       Vec by;
2719194d70fSJed Brown       ierr = VecGetSubVector(y,bA->isglobal.col[j],&by);CHKERRQ(ierr);
2729194d70fSJed Brown       ierr = VecCopy(by,bz[j]);CHKERRQ(ierr);
2739194d70fSJed Brown       ierr = VecRestoreSubVector(y,bA->isglobal.col[j],&by);CHKERRQ(ierr);
2749194d70fSJed Brown     }
2759194d70fSJed Brown     for (i=0; i<nr; i++) {
2766c75ac25SJed Brown       if (!bA->m[i][j]) continue;
2779194d70fSJed Brown       /* z[j] <- y[j] + (A[i][j])^T * x[i] */
2789194d70fSJed Brown       ierr = MatMultTransposeAdd(bA->m[i][j],bx[i],bz[j],bz[j]);CHKERRQ(ierr);
2799194d70fSJed Brown     }
2809194d70fSJed Brown   }
2819194d70fSJed Brown   for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);}
2829194d70fSJed Brown   for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(z,bA->isglobal.col[i],&bz[i]);CHKERRQ(ierr);}
2839194d70fSJed Brown   PetscFunctionReturn(0);
2849194d70fSJed Brown }
2859194d70fSJed Brown 
286f8170845SAlex Fikl static PetscErrorCode MatTranspose_Nest(Mat A,MatReuse reuse,Mat *B)
287f8170845SAlex Fikl {
288f8170845SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data, *bC;
289f8170845SAlex Fikl   Mat            C;
290f8170845SAlex Fikl   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
291f8170845SAlex Fikl   PetscErrorCode ierr;
292f8170845SAlex Fikl 
293f8170845SAlex Fikl   PetscFunctionBegin;
294cf37664fSBarry Smith   if (reuse == MAT_INPLACE_MATRIX && nr != nc) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_SIZ,"Square nested matrix only for in-place");
295f8170845SAlex Fikl 
296cf37664fSBarry Smith   if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_INPLACE_MATRIX) {
297f8170845SAlex Fikl     Mat *subs;
298f8170845SAlex Fikl     IS  *is_row,*is_col;
299f8170845SAlex Fikl 
300f8170845SAlex Fikl     ierr = PetscCalloc1(nr * nc,&subs);CHKERRQ(ierr);
301f8170845SAlex Fikl     ierr = PetscMalloc2(nr,&is_row,nc,&is_col);CHKERRQ(ierr);
302f8170845SAlex Fikl     ierr = MatNestGetISs(A,is_row,is_col);CHKERRQ(ierr);
303cf37664fSBarry Smith     if (reuse == MAT_INPLACE_MATRIX) {
304ddeb9bd8SAlex Fikl       for (i=0; i<nr; i++) {
305ddeb9bd8SAlex Fikl         for (j=0; j<nc; j++) {
306ddeb9bd8SAlex Fikl           subs[i + nr * j] = bA->m[i][j];
307ddeb9bd8SAlex Fikl         }
308ddeb9bd8SAlex Fikl       }
309ddeb9bd8SAlex Fikl     }
310ddeb9bd8SAlex Fikl 
311f8170845SAlex Fikl     ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nc,is_col,nr,is_row,subs,&C);CHKERRQ(ierr);
312f8170845SAlex Fikl     ierr = PetscFree(subs);CHKERRQ(ierr);
3133d994f23SBarry Smith     ierr = PetscFree2(is_row,is_col);CHKERRQ(ierr);
314f8170845SAlex Fikl   } else {
315f8170845SAlex Fikl     C = *B;
316f8170845SAlex Fikl   }
317f8170845SAlex Fikl 
318f8170845SAlex Fikl   bC = (Mat_Nest*)C->data;
319f8170845SAlex Fikl   for (i=0; i<nr; i++) {
320f8170845SAlex Fikl     for (j=0; j<nc; j++) {
321f8170845SAlex Fikl       if (bA->m[i][j]) {
322f8170845SAlex Fikl         ierr = MatTranspose(bA->m[i][j], reuse, &(bC->m[j][i]));CHKERRQ(ierr);
323f8170845SAlex Fikl       } else {
324f8170845SAlex Fikl         bC->m[j][i] = NULL;
325f8170845SAlex Fikl       }
326f8170845SAlex Fikl     }
327f8170845SAlex Fikl   }
328f8170845SAlex Fikl 
329cf37664fSBarry Smith   if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) {
330f8170845SAlex Fikl     *B = C;
331f8170845SAlex Fikl   } else {
332f8170845SAlex Fikl     ierr = MatHeaderMerge(A, &C);CHKERRQ(ierr);
333f8170845SAlex Fikl   }
334f8170845SAlex Fikl   PetscFunctionReturn(0);
335f8170845SAlex Fikl }
336f8170845SAlex Fikl 
337e2d7f03fSJed Brown static PetscErrorCode MatNestDestroyISList(PetscInt n,IS **list)
338e2d7f03fSJed Brown {
339e2d7f03fSJed Brown   PetscErrorCode ierr;
340e2d7f03fSJed Brown   IS             *lst = *list;
341e2d7f03fSJed Brown   PetscInt       i;
342e2d7f03fSJed Brown 
343e2d7f03fSJed Brown   PetscFunctionBegin;
344e2d7f03fSJed Brown   if (!lst) PetscFunctionReturn(0);
3456bf464f9SBarry Smith   for (i=0; i<n; i++) if (lst[i]) {ierr = ISDestroy(&lst[i]);CHKERRQ(ierr);}
346e2d7f03fSJed Brown   ierr  = PetscFree(lst);CHKERRQ(ierr);
3470298fd71SBarry Smith   *list = NULL;
348e2d7f03fSJed Brown   PetscFunctionReturn(0);
349e2d7f03fSJed Brown }
350e2d7f03fSJed Brown 
351207556f9SJed Brown static PetscErrorCode MatDestroy_Nest(Mat A)
352d8588912SDave May {
353d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
354d8588912SDave May   PetscInt       i,j;
355d8588912SDave May   PetscErrorCode ierr;
356d8588912SDave May 
357d8588912SDave May   PetscFunctionBegin;
358d8588912SDave May   /* release the matrices and the place holders */
359e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nr,&vs->isglobal.row);CHKERRQ(ierr);
360e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nc,&vs->isglobal.col);CHKERRQ(ierr);
361e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nr,&vs->islocal.row);CHKERRQ(ierr);
362e2d7f03fSJed Brown   ierr = MatNestDestroyISList(vs->nc,&vs->islocal.col);CHKERRQ(ierr);
363d8588912SDave May 
364d8588912SDave May   ierr = PetscFree(vs->row_len);CHKERRQ(ierr);
365d8588912SDave May   ierr = PetscFree(vs->col_len);CHKERRQ(ierr);
366d8588912SDave May 
367207556f9SJed Brown   ierr = PetscFree2(vs->left,vs->right);CHKERRQ(ierr);
368207556f9SJed Brown 
369d8588912SDave May   /* release the matrices and the place holders */
370d8588912SDave May   if (vs->m) {
371d8588912SDave May     for (i=0; i<vs->nr; i++) {
372d8588912SDave May       for (j=0; j<vs->nc; j++) {
3736bf464f9SBarry Smith         ierr = MatDestroy(&vs->m[i][j]);CHKERRQ(ierr);
374d8588912SDave May       }
375d8588912SDave May       ierr = PetscFree(vs->m[i]);CHKERRQ(ierr);
376d8588912SDave May     }
377d8588912SDave May     ierr = PetscFree(vs->m);CHKERRQ(ierr);
378d8588912SDave May   }
379bf0cc555SLisandro Dalcin   ierr = PetscFree(A->data);CHKERRQ(ierr);
380d8588912SDave May 
381bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",0);CHKERRQ(ierr);
382bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",0);CHKERRQ(ierr);
383bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",0);CHKERRQ(ierr);
384bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",0);CHKERRQ(ierr);
385bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",0);CHKERRQ(ierr);
386bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",0);CHKERRQ(ierr);
387bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",0);CHKERRQ(ierr);
388bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",0);CHKERRQ(ierr);
3890899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",0);CHKERRQ(ierr);
3900899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",0);CHKERRQ(ierr);
3915e3038f0Sstefano_zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",0);CHKERRQ(ierr);
3925e3038f0Sstefano_zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",0);CHKERRQ(ierr);
39352c5f739Sprj-   ierr = PetscObjectComposeFunction((PetscObject)A,"MatMatMult_nest_mpidense_C",0);CHKERRQ(ierr);
39452c5f739Sprj-   ierr = PetscObjectComposeFunction((PetscObject)A,"MatMatMult_nest_seqdense_C",0);CHKERRQ(ierr);
39552c5f739Sprj-   ierr = PetscObjectComposeFunction((PetscObject)A,"MatMatMult_nest_dense_C",0);CHKERRQ(ierr);
396d8588912SDave May   PetscFunctionReturn(0);
397d8588912SDave May }
398d8588912SDave May 
399207556f9SJed Brown static PetscErrorCode MatAssemblyBegin_Nest(Mat A,MatAssemblyType type)
400d8588912SDave May {
401d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
402d8588912SDave May   PetscInt       i,j;
403d8588912SDave May   PetscErrorCode ierr;
404d8588912SDave May 
405d8588912SDave May   PetscFunctionBegin;
406d8588912SDave May   for (i=0; i<vs->nr; i++) {
407d8588912SDave May     for (j=0; j<vs->nc; j++) {
408e7c19651SJed Brown       if (vs->m[i][j]) {
409e7c19651SJed Brown         ierr = MatAssemblyBegin(vs->m[i][j],type);CHKERRQ(ierr);
410e7c19651SJed Brown         if (!vs->splitassembly) {
411e7c19651SJed Brown           /* Note: split assembly will fail if the same block appears more than once (even indirectly through a nested
412e7c19651SJed Brown            * sub-block). This could be fixed by adding a flag to Mat so that there was a way to check if a Mat was
413e7c19651SJed Brown            * already performing an assembly, but the result would by more complicated and appears to offer less
414e7c19651SJed Brown            * potential for diagnostics and correctness checking. Split assembly should be fixed once there is an
415e7c19651SJed Brown            * interface for libraries to make asynchronous progress in "user-defined non-blocking collectives".
416e7c19651SJed Brown            */
417e7c19651SJed Brown           ierr = MatAssemblyEnd(vs->m[i][j],type);CHKERRQ(ierr);
418e7c19651SJed Brown         }
419e7c19651SJed Brown       }
420d8588912SDave May     }
421d8588912SDave May   }
422d8588912SDave May   PetscFunctionReturn(0);
423d8588912SDave May }
424d8588912SDave May 
425207556f9SJed Brown static PetscErrorCode MatAssemblyEnd_Nest(Mat A, MatAssemblyType type)
426d8588912SDave May {
427d8588912SDave May   Mat_Nest       *vs = (Mat_Nest*)A->data;
428d8588912SDave May   PetscInt       i,j;
429d8588912SDave May   PetscErrorCode ierr;
430d8588912SDave May 
431d8588912SDave May   PetscFunctionBegin;
432d8588912SDave May   for (i=0; i<vs->nr; i++) {
433d8588912SDave May     for (j=0; j<vs->nc; j++) {
434e7c19651SJed Brown       if (vs->m[i][j]) {
435e7c19651SJed Brown         if (vs->splitassembly) {
436e7c19651SJed Brown           ierr = MatAssemblyEnd(vs->m[i][j],type);CHKERRQ(ierr);
437e7c19651SJed Brown         }
438e7c19651SJed Brown       }
439d8588912SDave May     }
440d8588912SDave May   }
441d8588912SDave May   PetscFunctionReturn(0);
442d8588912SDave May }
443d8588912SDave May 
444f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatRow(Mat A,PetscInt row,Mat *B)
445d8588912SDave May {
446207556f9SJed Brown   PetscErrorCode ierr;
447f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
448f349c1fdSJed Brown   PetscInt       j;
449f349c1fdSJed Brown   Mat            sub;
450d8588912SDave May 
451d8588912SDave May   PetscFunctionBegin;
4520298fd71SBarry Smith   sub = (row < vs->nc) ? vs->m[row][row] : (Mat)NULL; /* Prefer to find on the diagonal */
453f349c1fdSJed Brown   for (j=0; !sub && j<vs->nc; j++) sub = vs->m[row][j];
4544994cf47SJed Brown   if (sub) {ierr = MatSetUp(sub);CHKERRQ(ierr);}       /* Ensure that the sizes are available */
455f349c1fdSJed Brown   *B = sub;
456f349c1fdSJed Brown   PetscFunctionReturn(0);
457d8588912SDave May }
458d8588912SDave May 
459f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatCol(Mat A,PetscInt col,Mat *B)
460f349c1fdSJed Brown {
461207556f9SJed Brown   PetscErrorCode ierr;
462f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
463f349c1fdSJed Brown   PetscInt       i;
464f349c1fdSJed Brown   Mat            sub;
465f349c1fdSJed Brown 
466f349c1fdSJed Brown   PetscFunctionBegin;
4670298fd71SBarry Smith   sub = (col < vs->nr) ? vs->m[col][col] : (Mat)NULL; /* Prefer to find on the diagonal */
468f349c1fdSJed Brown   for (i=0; !sub && i<vs->nr; i++) sub = vs->m[i][col];
4694994cf47SJed Brown   if (sub) {ierr = MatSetUp(sub);CHKERRQ(ierr);}       /* Ensure that the sizes are available */
470f349c1fdSJed Brown   *B = sub;
471f349c1fdSJed Brown   PetscFunctionReturn(0);
472d8588912SDave May }
473d8588912SDave May 
474f349c1fdSJed Brown static PetscErrorCode MatNestFindIS(Mat A,PetscInt n,const IS list[],IS is,PetscInt *found)
475f349c1fdSJed Brown {
476f349c1fdSJed Brown   PetscErrorCode ierr;
477f349c1fdSJed Brown   PetscInt       i;
478f349c1fdSJed Brown   PetscBool      flg;
479f349c1fdSJed Brown 
480f349c1fdSJed Brown   PetscFunctionBegin;
481f349c1fdSJed Brown   PetscValidPointer(list,3);
482f349c1fdSJed Brown   PetscValidHeaderSpecific(is,IS_CLASSID,4);
483f349c1fdSJed Brown   PetscValidIntPointer(found,5);
484f349c1fdSJed Brown   *found = -1;
485f349c1fdSJed Brown   for (i=0; i<n; i++) {
486207556f9SJed Brown     if (!list[i]) continue;
487f349c1fdSJed Brown     ierr = ISEqual(list[i],is,&flg);CHKERRQ(ierr);
488f349c1fdSJed Brown     if (flg) {
489f349c1fdSJed Brown       *found = i;
490f349c1fdSJed Brown       PetscFunctionReturn(0);
491f349c1fdSJed Brown     }
492f349c1fdSJed Brown   }
493ce94432eSBarry Smith   SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Could not find index set");
494f349c1fdSJed Brown   PetscFunctionReturn(0);
495f349c1fdSJed Brown }
496f349c1fdSJed Brown 
4978188e55aSJed Brown /* Get a block row as a new MatNest */
4988188e55aSJed Brown static PetscErrorCode MatNestGetRow(Mat A,PetscInt row,Mat *B)
4998188e55aSJed Brown {
5008188e55aSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
5018188e55aSJed Brown   char           keyname[256];
5028188e55aSJed Brown   PetscErrorCode ierr;
5038188e55aSJed Brown 
5048188e55aSJed Brown   PetscFunctionBegin;
5050298fd71SBarry Smith   *B   = NULL;
5068caf3d72SBarry Smith   ierr = PetscSNPrintf(keyname,sizeof(keyname),"NestRow_%D",row);CHKERRQ(ierr);
5078188e55aSJed Brown   ierr = PetscObjectQuery((PetscObject)A,keyname,(PetscObject*)B);CHKERRQ(ierr);
5088188e55aSJed Brown   if (*B) PetscFunctionReturn(0);
5098188e55aSJed Brown 
510ce94432eSBarry Smith   ierr = MatCreateNest(PetscObjectComm((PetscObject)A),1,NULL,vs->nc,vs->isglobal.col,vs->m[row],B);CHKERRQ(ierr);
51126fbe8dcSKarl Rupp 
5128188e55aSJed Brown   (*B)->assembled = A->assembled;
51326fbe8dcSKarl Rupp 
5148188e55aSJed Brown   ierr = PetscObjectCompose((PetscObject)A,keyname,(PetscObject)*B);CHKERRQ(ierr);
5158188e55aSJed Brown   ierr = PetscObjectDereference((PetscObject)*B);CHKERRQ(ierr); /* Leave the only remaining reference in the composition */
5168188e55aSJed Brown   PetscFunctionReturn(0);
5178188e55aSJed Brown }
5188188e55aSJed Brown 
519f349c1fdSJed Brown static PetscErrorCode MatNestFindSubMat(Mat A,struct MatNestISPair *is,IS isrow,IS iscol,Mat *B)
520f349c1fdSJed Brown {
521f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
5228188e55aSJed Brown   PetscErrorCode ierr;
5236b3a5b13SJed Brown   PetscInt       row,col;
524e072481dSJed Brown   PetscBool      same,isFullCol,isFullColGlobal;
525f349c1fdSJed Brown 
526f349c1fdSJed Brown   PetscFunctionBegin;
5278188e55aSJed Brown   /* Check if full column space. This is a hack */
5288188e55aSJed Brown   isFullCol = PETSC_FALSE;
529251f4c67SDmitry Karpeev   ierr      = PetscObjectTypeCompare((PetscObject)iscol,ISSTRIDE,&same);CHKERRQ(ierr);
5308188e55aSJed Brown   if (same) {
53177019fcaSJed Brown     PetscInt n,first,step,i,an,am,afirst,astep;
5328188e55aSJed Brown     ierr      = ISStrideGetInfo(iscol,&first,&step);CHKERRQ(ierr);
5338188e55aSJed Brown     ierr      = ISGetLocalSize(iscol,&n);CHKERRQ(ierr);
53477019fcaSJed Brown     isFullCol = PETSC_TRUE;
53505ce4453SJed Brown     for (i=0,an=A->cmap->rstart; i<vs->nc; i++) {
53677019fcaSJed Brown       ierr = ISStrideGetInfo(is->col[i],&afirst,&astep);CHKERRQ(ierr);
53777019fcaSJed Brown       ierr = ISGetLocalSize(is->col[i],&am);CHKERRQ(ierr);
53877019fcaSJed Brown       if (afirst != an || astep != step) isFullCol = PETSC_FALSE;
53977019fcaSJed Brown       an += am;
54077019fcaSJed Brown     }
54105ce4453SJed Brown     if (an != A->cmap->rstart+n) isFullCol = PETSC_FALSE;
5428188e55aSJed Brown   }
543b2566f29SBarry Smith   ierr = MPIU_Allreduce(&isFullCol,&isFullColGlobal,1,MPIU_BOOL,MPI_LAND,PetscObjectComm((PetscObject)iscol));CHKERRQ(ierr);
5448188e55aSJed Brown 
545427230ceSLisandro Dalcin   if (isFullColGlobal && vs->nc > 1) {
5468188e55aSJed Brown     PetscInt row;
5478188e55aSJed Brown     ierr = MatNestFindIS(A,vs->nr,is->row,isrow,&row);CHKERRQ(ierr);
5488188e55aSJed Brown     ierr = MatNestGetRow(A,row,B);CHKERRQ(ierr);
5498188e55aSJed Brown   } else {
550f349c1fdSJed Brown     ierr = MatNestFindIS(A,vs->nr,is->row,isrow,&row);CHKERRQ(ierr);
551f349c1fdSJed Brown     ierr = MatNestFindIS(A,vs->nc,is->col,iscol,&col);CHKERRQ(ierr);
552b6480e04SStefano Zampini     if (!vs->m[row][col]) {
553b6480e04SStefano Zampini       PetscInt lr,lc;
554b6480e04SStefano Zampini 
555b6480e04SStefano Zampini       ierr = MatCreate(PetscObjectComm((PetscObject)A),&vs->m[row][col]);CHKERRQ(ierr);
556b6480e04SStefano Zampini       ierr = ISGetLocalSize(vs->isglobal.row[row],&lr);CHKERRQ(ierr);
557b6480e04SStefano Zampini       ierr = ISGetLocalSize(vs->isglobal.col[col],&lc);CHKERRQ(ierr);
558b6480e04SStefano Zampini       ierr = MatSetSizes(vs->m[row][col],lr,lc,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr);
559b6480e04SStefano Zampini       ierr = MatSetUp(vs->m[row][col]);CHKERRQ(ierr);
560b6480e04SStefano Zampini       ierr = MatAssemblyBegin(vs->m[row][col],MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
561b6480e04SStefano Zampini       ierr = MatAssemblyEnd(vs->m[row][col],MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
562b6480e04SStefano Zampini     }
563f349c1fdSJed Brown     *B = vs->m[row][col];
5648188e55aSJed Brown   }
565f349c1fdSJed Brown   PetscFunctionReturn(0);
566f349c1fdSJed Brown }
567f349c1fdSJed Brown 
5687dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrix_Nest(Mat A,IS isrow,IS iscol,MatReuse reuse,Mat *B)
569f349c1fdSJed Brown {
570f349c1fdSJed Brown   PetscErrorCode ierr;
571f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
572f349c1fdSJed Brown   Mat            sub;
573f349c1fdSJed Brown 
574f349c1fdSJed Brown   PetscFunctionBegin;
575f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->isglobal,isrow,iscol,&sub);CHKERRQ(ierr);
576f349c1fdSJed Brown   switch (reuse) {
577f349c1fdSJed Brown   case MAT_INITIAL_MATRIX:
5787874fa86SDave May     if (sub) { ierr = PetscObjectReference((PetscObject)sub);CHKERRQ(ierr); }
579f349c1fdSJed Brown     *B = sub;
580f349c1fdSJed Brown     break;
581f349c1fdSJed Brown   case MAT_REUSE_MATRIX:
582ce94432eSBarry Smith     if (sub != *B) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Submatrix was not used before in this call");
583f349c1fdSJed Brown     break;
584f349c1fdSJed Brown   case MAT_IGNORE_MATRIX:       /* Nothing to do */
585f349c1fdSJed Brown     break;
586511c6705SHong Zhang   case MAT_INPLACE_MATRIX:       /* Nothing to do */
587511c6705SHong Zhang     SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MAT_INPLACE_MATRIX is not supported yet");
588511c6705SHong Zhang     break;
589f349c1fdSJed Brown   }
590f349c1fdSJed Brown   PetscFunctionReturn(0);
591f349c1fdSJed Brown }
592f349c1fdSJed Brown 
593f349c1fdSJed Brown PetscErrorCode MatGetLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B)
594f349c1fdSJed Brown {
595f349c1fdSJed Brown   PetscErrorCode ierr;
596f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
597f349c1fdSJed Brown   Mat            sub;
598f349c1fdSJed Brown 
599f349c1fdSJed Brown   PetscFunctionBegin;
600f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub);CHKERRQ(ierr);
601f349c1fdSJed Brown   /* We allow the submatrix to be NULL, perhaps it would be better for the user to return an empty matrix instead */
602f349c1fdSJed Brown   if (sub) {ierr = PetscObjectReference((PetscObject)sub);CHKERRQ(ierr);}
603f349c1fdSJed Brown   *B = sub;
604d8588912SDave May   PetscFunctionReturn(0);
605d8588912SDave May }
606d8588912SDave May 
607207556f9SJed Brown static PetscErrorCode MatRestoreLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B)
608d8588912SDave May {
609d8588912SDave May   PetscErrorCode ierr;
610f349c1fdSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
611f349c1fdSJed Brown   Mat            sub;
612d8588912SDave May 
613d8588912SDave May   PetscFunctionBegin;
614f349c1fdSJed Brown   ierr = MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub);CHKERRQ(ierr);
615ce94432eSBarry Smith   if (*B != sub) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has not been gotten");
616f349c1fdSJed Brown   if (sub) {
617ce94432eSBarry Smith     if (((PetscObject)sub)->refct <= 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has had reference count decremented too many times");
6186bf464f9SBarry Smith     ierr = MatDestroy(B);CHKERRQ(ierr);
619d8588912SDave May   }
620d8588912SDave May   PetscFunctionReturn(0);
621d8588912SDave May }
622d8588912SDave May 
6237874fa86SDave May static PetscErrorCode MatGetDiagonal_Nest(Mat A,Vec v)
6247874fa86SDave May {
6257874fa86SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
6267874fa86SDave May   PetscInt       i;
6277874fa86SDave May   PetscErrorCode ierr;
6287874fa86SDave May 
6297874fa86SDave May   PetscFunctionBegin;
6307874fa86SDave May   for (i=0; i<bA->nr; i++) {
631429bac76SJed Brown     Vec bv;
632429bac76SJed Brown     ierr = VecGetSubVector(v,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
6337874fa86SDave May     if (bA->m[i][i]) {
634429bac76SJed Brown       ierr = MatGetDiagonal(bA->m[i][i],bv);CHKERRQ(ierr);
6357874fa86SDave May     } else {
6365159a857SMatthew G. Knepley       ierr = VecSet(bv,0.0);CHKERRQ(ierr);
6377874fa86SDave May     }
638429bac76SJed Brown     ierr = VecRestoreSubVector(v,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
6397874fa86SDave May   }
6407874fa86SDave May   PetscFunctionReturn(0);
6417874fa86SDave May }
6427874fa86SDave May 
6437874fa86SDave May static PetscErrorCode MatDiagonalScale_Nest(Mat A,Vec l,Vec r)
6447874fa86SDave May {
6457874fa86SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
646429bac76SJed Brown   Vec            bl,*br;
6477874fa86SDave May   PetscInt       i,j;
6487874fa86SDave May   PetscErrorCode ierr;
6497874fa86SDave May 
6507874fa86SDave May   PetscFunctionBegin;
6513f800ebeSJed Brown   ierr = PetscCalloc1(bA->nc,&br);CHKERRQ(ierr);
6522e6472ebSElliott Sales de Andrade   if (r) {
653429bac76SJed Brown     for (j=0; j<bA->nc; j++) {ierr = VecGetSubVector(r,bA->isglobal.col[j],&br[j]);CHKERRQ(ierr);}
6542e6472ebSElliott Sales de Andrade   }
6552e6472ebSElliott Sales de Andrade   bl = NULL;
6567874fa86SDave May   for (i=0; i<bA->nr; i++) {
6572e6472ebSElliott Sales de Andrade     if (l) {
658429bac76SJed Brown       ierr = VecGetSubVector(l,bA->isglobal.row[i],&bl);CHKERRQ(ierr);
6592e6472ebSElliott Sales de Andrade     }
6607874fa86SDave May     for (j=0; j<bA->nc; j++) {
6617874fa86SDave May       if (bA->m[i][j]) {
662429bac76SJed Brown         ierr = MatDiagonalScale(bA->m[i][j],bl,br[j]);CHKERRQ(ierr);
6637874fa86SDave May       }
6647874fa86SDave May     }
6652e6472ebSElliott Sales de Andrade     if (l) {
666a061e289SJed Brown       ierr = VecRestoreSubVector(l,bA->isglobal.row[i],&bl);CHKERRQ(ierr);
6677874fa86SDave May     }
6682e6472ebSElliott Sales de Andrade   }
6692e6472ebSElliott Sales de Andrade   if (r) {
670429bac76SJed Brown     for (j=0; j<bA->nc; j++) {ierr = VecRestoreSubVector(r,bA->isglobal.col[j],&br[j]);CHKERRQ(ierr);}
6712e6472ebSElliott Sales de Andrade   }
672429bac76SJed Brown   ierr = PetscFree(br);CHKERRQ(ierr);
6737874fa86SDave May   PetscFunctionReturn(0);
6747874fa86SDave May }
6757874fa86SDave May 
676a061e289SJed Brown static PetscErrorCode MatScale_Nest(Mat A,PetscScalar a)
677a061e289SJed Brown {
678a061e289SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
679a061e289SJed Brown   PetscInt       i,j;
680a061e289SJed Brown   PetscErrorCode ierr;
681a061e289SJed Brown 
682a061e289SJed Brown   PetscFunctionBegin;
683a061e289SJed Brown   for (i=0; i<bA->nr; i++) {
684a061e289SJed Brown     for (j=0; j<bA->nc; j++) {
685a061e289SJed Brown       if (bA->m[i][j]) {
686a061e289SJed Brown         ierr = MatScale(bA->m[i][j],a);CHKERRQ(ierr);
687a061e289SJed Brown       }
688a061e289SJed Brown     }
689a061e289SJed Brown   }
690a061e289SJed Brown   PetscFunctionReturn(0);
691a061e289SJed Brown }
692a061e289SJed Brown 
693a061e289SJed Brown static PetscErrorCode MatShift_Nest(Mat A,PetscScalar a)
694a061e289SJed Brown {
695a061e289SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
696a061e289SJed Brown   PetscInt       i;
697a061e289SJed Brown   PetscErrorCode ierr;
698a061e289SJed Brown 
699a061e289SJed Brown   PetscFunctionBegin;
700a061e289SJed Brown   for (i=0; i<bA->nr; i++) {
701ce94432eSBarry Smith     if (!bA->m[i][i]) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"No support for shifting an empty diagonal block, insert a matrix in block (%D,%D)",i,i);
702a061e289SJed Brown     ierr = MatShift(bA->m[i][i],a);CHKERRQ(ierr);
703a061e289SJed Brown   }
704a061e289SJed Brown   PetscFunctionReturn(0);
705a061e289SJed Brown }
706a061e289SJed Brown 
70713135bc6SAlex Fikl static PetscErrorCode MatDiagonalSet_Nest(Mat A,Vec D,InsertMode is)
70813135bc6SAlex Fikl {
70913135bc6SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data;
71013135bc6SAlex Fikl   PetscInt       i;
71113135bc6SAlex Fikl   PetscErrorCode ierr;
71213135bc6SAlex Fikl 
71313135bc6SAlex Fikl   PetscFunctionBegin;
71413135bc6SAlex Fikl   for (i=0; i<bA->nr; i++) {
71513135bc6SAlex Fikl     Vec bv;
71613135bc6SAlex Fikl     ierr = VecGetSubVector(D,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
71713135bc6SAlex Fikl     if (bA->m[i][i]) {
71813135bc6SAlex Fikl       ierr = MatDiagonalSet(bA->m[i][i],bv,is);CHKERRQ(ierr);
71913135bc6SAlex Fikl     }
72013135bc6SAlex Fikl     ierr = VecRestoreSubVector(D,bA->isglobal.row[i],&bv);CHKERRQ(ierr);
72113135bc6SAlex Fikl   }
72213135bc6SAlex Fikl   PetscFunctionReturn(0);
72313135bc6SAlex Fikl }
72413135bc6SAlex Fikl 
725f8170845SAlex Fikl static PetscErrorCode MatSetRandom_Nest(Mat A,PetscRandom rctx)
726f8170845SAlex Fikl {
727f8170845SAlex Fikl   Mat_Nest       *bA = (Mat_Nest*)A->data;
728f8170845SAlex Fikl   PetscInt       i,j;
729f8170845SAlex Fikl   PetscErrorCode ierr;
730f8170845SAlex Fikl 
731f8170845SAlex Fikl   PetscFunctionBegin;
732f8170845SAlex Fikl   for (i=0; i<bA->nr; i++) {
733f8170845SAlex Fikl     for (j=0; j<bA->nc; j++) {
734f8170845SAlex Fikl       if (bA->m[i][j]) {
735f8170845SAlex Fikl         ierr = MatSetRandom(bA->m[i][j],rctx);CHKERRQ(ierr);
736f8170845SAlex Fikl       }
737f8170845SAlex Fikl     }
738f8170845SAlex Fikl   }
739f8170845SAlex Fikl   PetscFunctionReturn(0);
740f8170845SAlex Fikl }
741f8170845SAlex Fikl 
7422a7a6963SBarry Smith static PetscErrorCode MatCreateVecs_Nest(Mat A,Vec *right,Vec *left)
743d8588912SDave May {
744d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
745d8588912SDave May   Vec            *L,*R;
746d8588912SDave May   MPI_Comm       comm;
747d8588912SDave May   PetscInt       i,j;
748d8588912SDave May   PetscErrorCode ierr;
749d8588912SDave May 
750d8588912SDave May   PetscFunctionBegin;
751ce94432eSBarry Smith   ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr);
752d8588912SDave May   if (right) {
753d8588912SDave May     /* allocate R */
754854ce69bSBarry Smith     ierr = PetscMalloc1(bA->nc, &R);CHKERRQ(ierr);
755d8588912SDave May     /* Create the right vectors */
756d8588912SDave May     for (j=0; j<bA->nc; j++) {
757d8588912SDave May       for (i=0; i<bA->nr; i++) {
758d8588912SDave May         if (bA->m[i][j]) {
7592a7a6963SBarry Smith           ierr = MatCreateVecs(bA->m[i][j],&R[j],NULL);CHKERRQ(ierr);
760d8588912SDave May           break;
761d8588912SDave May         }
762d8588912SDave May       }
7636c4ed002SBarry Smith       if (i==bA->nr) SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null column.");
764d8588912SDave May     }
765f349c1fdSJed Brown     ierr = VecCreateNest(comm,bA->nc,bA->isglobal.col,R,right);CHKERRQ(ierr);
766d8588912SDave May     /* hand back control to the nest vector */
767d8588912SDave May     for (j=0; j<bA->nc; j++) {
7686bf464f9SBarry Smith       ierr = VecDestroy(&R[j]);CHKERRQ(ierr);
769d8588912SDave May     }
770d8588912SDave May     ierr = PetscFree(R);CHKERRQ(ierr);
771d8588912SDave May   }
772d8588912SDave May 
773d8588912SDave May   if (left) {
774d8588912SDave May     /* allocate L */
775854ce69bSBarry Smith     ierr = PetscMalloc1(bA->nr, &L);CHKERRQ(ierr);
776d8588912SDave May     /* Create the left vectors */
777d8588912SDave May     for (i=0; i<bA->nr; i++) {
778d8588912SDave May       for (j=0; j<bA->nc; j++) {
779d8588912SDave May         if (bA->m[i][j]) {
7802a7a6963SBarry Smith           ierr = MatCreateVecs(bA->m[i][j],NULL,&L[i]);CHKERRQ(ierr);
781d8588912SDave May           break;
782d8588912SDave May         }
783d8588912SDave May       }
7846c4ed002SBarry Smith       if (j==bA->nc) SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null row.");
785d8588912SDave May     }
786d8588912SDave May 
787f349c1fdSJed Brown     ierr = VecCreateNest(comm,bA->nr,bA->isglobal.row,L,left);CHKERRQ(ierr);
788d8588912SDave May     for (i=0; i<bA->nr; i++) {
7896bf464f9SBarry Smith       ierr = VecDestroy(&L[i]);CHKERRQ(ierr);
790d8588912SDave May     }
791d8588912SDave May 
792d8588912SDave May     ierr = PetscFree(L);CHKERRQ(ierr);
793d8588912SDave May   }
794d8588912SDave May   PetscFunctionReturn(0);
795d8588912SDave May }
796d8588912SDave May 
797207556f9SJed Brown static PetscErrorCode MatView_Nest(Mat A,PetscViewer viewer)
798d8588912SDave May {
799d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
80029e60adbSStefano Zampini   PetscBool      isascii,viewSub = PETSC_FALSE;
801d8588912SDave May   PetscInt       i,j;
802d8588912SDave May   PetscErrorCode ierr;
803d8588912SDave May 
804d8588912SDave May   PetscFunctionBegin;
805251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
806d8588912SDave May   if (isascii) {
807d8588912SDave May 
80829e60adbSStefano Zampini     ierr = PetscOptionsGetBool(((PetscObject)A)->options,((PetscObject)A)->prefix,"-mat_view_nest_sub",&viewSub,NULL);CHKERRQ(ierr);
809d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"Matrix object: \n");CHKERRQ(ierr);
810d86155a6SBarry Smith     ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);
811d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer, "type=nest, rows=%D, cols=%D \n",bA->nr,bA->nc);CHKERRQ(ierr);
812d8588912SDave May 
813d86155a6SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"MatNest structure: \n");CHKERRQ(ierr);
814d8588912SDave May     for (i=0; i<bA->nr; i++) {
815d8588912SDave May       for (j=0; j<bA->nc; j++) {
81619fd82e9SBarry Smith         MatType   type;
817270f95d7SJed Brown         char      name[256] = "",prefix[256] = "";
818d8588912SDave May         PetscInt  NR,NC;
819d8588912SDave May         PetscBool isNest = PETSC_FALSE;
820d8588912SDave May 
821d8588912SDave May         if (!bA->m[i][j]) {
822d86155a6SBarry Smith           CHKERRQ(ierr);PetscViewerASCIIPrintf(viewer, "(%D,%D) : NULL \n",i,j);CHKERRQ(ierr);
823d8588912SDave May           continue;
824d8588912SDave May         }
825d8588912SDave May         ierr = MatGetSize(bA->m[i][j],&NR,&NC);CHKERRQ(ierr);
826d8588912SDave May         ierr = MatGetType(bA->m[i][j], &type);CHKERRQ(ierr);
8278caf3d72SBarry Smith         if (((PetscObject)bA->m[i][j])->name) {ierr = PetscSNPrintf(name,sizeof(name),"name=\"%s\", ",((PetscObject)bA->m[i][j])->name);CHKERRQ(ierr);}
8288caf3d72SBarry Smith         if (((PetscObject)bA->m[i][j])->prefix) {ierr = PetscSNPrintf(prefix,sizeof(prefix),"prefix=\"%s\", ",((PetscObject)bA->m[i][j])->prefix);CHKERRQ(ierr);}
829251f4c67SDmitry Karpeev         ierr = PetscObjectTypeCompare((PetscObject)bA->m[i][j],MATNEST,&isNest);CHKERRQ(ierr);
830d8588912SDave May 
831270f95d7SJed Brown         ierr = PetscViewerASCIIPrintf(viewer,"(%D,%D) : %s%stype=%s, rows=%D, cols=%D \n",i,j,name,prefix,type,NR,NC);CHKERRQ(ierr);
832d8588912SDave May 
83329e60adbSStefano Zampini         if (isNest || viewSub) {
834270f95d7SJed Brown           ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);  /* push1 */
835d8588912SDave May           ierr = MatView(bA->m[i][j],viewer);CHKERRQ(ierr);
836270f95d7SJed Brown           ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);    /* pop1 */
837d8588912SDave May         }
838d8588912SDave May       }
839d8588912SDave May     }
840d86155a6SBarry Smith     ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);    /* pop0 */
841d8588912SDave May   }
842d8588912SDave May   PetscFunctionReturn(0);
843d8588912SDave May }
844d8588912SDave May 
845207556f9SJed Brown static PetscErrorCode MatZeroEntries_Nest(Mat A)
846d8588912SDave May {
847d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
848d8588912SDave May   PetscInt       i,j;
849d8588912SDave May   PetscErrorCode ierr;
850d8588912SDave May 
851d8588912SDave May   PetscFunctionBegin;
852d8588912SDave May   for (i=0; i<bA->nr; i++) {
853d8588912SDave May     for (j=0; j<bA->nc; j++) {
854d8588912SDave May       if (!bA->m[i][j]) continue;
855d8588912SDave May       ierr = MatZeroEntries(bA->m[i][j]);CHKERRQ(ierr);
856d8588912SDave May     }
857d8588912SDave May   }
858d8588912SDave May   PetscFunctionReturn(0);
859d8588912SDave May }
860d8588912SDave May 
861c222c20dSDavid Ham static PetscErrorCode MatCopy_Nest(Mat A,Mat B,MatStructure str)
862c222c20dSDavid Ham {
863c222c20dSDavid Ham   Mat_Nest       *bA = (Mat_Nest*)A->data,*bB = (Mat_Nest*)B->data;
864c222c20dSDavid Ham   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
865c222c20dSDavid Ham   PetscErrorCode ierr;
866c222c20dSDavid Ham 
867c222c20dSDavid Ham   PetscFunctionBegin;
868c222c20dSDavid Ham   if (nr != bB->nr || nc != bB->nc) SETERRQ4(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Cannot copy a Mat_Nest of block size (%D,%D) to a Mat_Nest of block size (%D,%D)",bB->nr,bB->nc,nr,nc);
869c222c20dSDavid Ham   for (i=0; i<nr; i++) {
870c222c20dSDavid Ham     for (j=0; j<nc; j++) {
87146a2b97cSJed Brown       if (bA->m[i][j] && bB->m[i][j]) {
872c222c20dSDavid Ham         ierr = MatCopy(bA->m[i][j],bB->m[i][j],str);CHKERRQ(ierr);
87346a2b97cSJed Brown       } else if (bA->m[i][j] || bB->m[i][j]) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %D,%D",i,j);
874c222c20dSDavid Ham     }
875c222c20dSDavid Ham   }
876cdc753b6SBarry Smith   ierr = PetscObjectStateIncrease((PetscObject)B);CHKERRQ(ierr);
877c222c20dSDavid Ham   PetscFunctionReturn(0);
878c222c20dSDavid Ham }
879c222c20dSDavid Ham 
8806e76ffeaSPierre Jolivet static PetscErrorCode MatAXPY_Nest(Mat Y,PetscScalar a,Mat X,MatStructure str)
8816e76ffeaSPierre Jolivet {
8826e76ffeaSPierre Jolivet   Mat_Nest       *bY = (Mat_Nest*)Y->data,*bX = (Mat_Nest*)X->data;
8836e76ffeaSPierre Jolivet   PetscInt       i,j,nr = bY->nr,nc = bY->nc;
8846e76ffeaSPierre Jolivet   PetscErrorCode ierr;
8856e76ffeaSPierre Jolivet 
8866e76ffeaSPierre Jolivet   PetscFunctionBegin;
8876e76ffeaSPierre Jolivet   if (nr != bX->nr || nc != bX->nc) SETERRQ4(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Cannot AXPY a MatNest of block size (%D,%D) with a MatNest of block size (%D,%D)",bX->nr,bX->nc,nr,nc);
8886e76ffeaSPierre Jolivet   for (i=0; i<nr; i++) {
8896e76ffeaSPierre Jolivet     for (j=0; j<nc; j++) {
8906e76ffeaSPierre Jolivet       if (bY->m[i][j] && bX->m[i][j]) {
8916e76ffeaSPierre Jolivet         ierr = MatAXPY(bY->m[i][j],a,bX->m[i][j],str);CHKERRQ(ierr);
892c066aebcSStefano Zampini       } else if (bX->m[i][j]) {
893c066aebcSStefano Zampini         Mat M;
894c066aebcSStefano Zampini 
895c066aebcSStefano Zampini         if (str != DIFFERENT_NONZERO_PATTERN) SETERRQ2(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %D,%D",i,j);
896c066aebcSStefano Zampini         ierr = MatDuplicate(bX->m[i][j],MAT_COPY_VALUES,&M);CHKERRQ(ierr);
897c066aebcSStefano Zampini         ierr = MatNestSetSubMat(Y,i,j,M);CHKERRQ(ierr);
898c066aebcSStefano Zampini         ierr = MatDestroy(&M);CHKERRQ(ierr);
899c066aebcSStefano Zampini       }
9006e76ffeaSPierre Jolivet     }
9016e76ffeaSPierre Jolivet   }
9026e76ffeaSPierre Jolivet   PetscFunctionReturn(0);
9036e76ffeaSPierre Jolivet }
9046e76ffeaSPierre Jolivet 
905207556f9SJed Brown static PetscErrorCode MatDuplicate_Nest(Mat A,MatDuplicateOption op,Mat *B)
906d8588912SDave May {
907d8588912SDave May   Mat_Nest       *bA = (Mat_Nest*)A->data;
908841e96a3SJed Brown   Mat            *b;
909841e96a3SJed Brown   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
910d8588912SDave May   PetscErrorCode ierr;
911d8588912SDave May 
912d8588912SDave May   PetscFunctionBegin;
913785e854fSJed Brown   ierr = PetscMalloc1(nr*nc,&b);CHKERRQ(ierr);
914841e96a3SJed Brown   for (i=0; i<nr; i++) {
915841e96a3SJed Brown     for (j=0; j<nc; j++) {
916841e96a3SJed Brown       if (bA->m[i][j]) {
917841e96a3SJed Brown         ierr = MatDuplicate(bA->m[i][j],op,&b[i*nc+j]);CHKERRQ(ierr);
918841e96a3SJed Brown       } else {
9190298fd71SBarry Smith         b[i*nc+j] = NULL;
920d8588912SDave May       }
921d8588912SDave May     }
922d8588912SDave May   }
923ce94432eSBarry Smith   ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nr,bA->isglobal.row,nc,bA->isglobal.col,b,B);CHKERRQ(ierr);
924841e96a3SJed Brown   /* Give the new MatNest exclusive ownership */
925841e96a3SJed Brown   for (i=0; i<nr*nc; i++) {
9266bf464f9SBarry Smith     ierr = MatDestroy(&b[i]);CHKERRQ(ierr);
927d8588912SDave May   }
928d8588912SDave May   ierr = PetscFree(b);CHKERRQ(ierr);
929d8588912SDave May 
930841e96a3SJed Brown   ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
931841e96a3SJed Brown   ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
932d8588912SDave May   PetscFunctionReturn(0);
933d8588912SDave May }
934d8588912SDave May 
935d8588912SDave May /* nest api */
936d8588912SDave May PetscErrorCode MatNestGetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat *mat)
937d8588912SDave May {
938d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
9395fd66863SKarl Rupp 
940d8588912SDave May   PetscFunctionBegin;
941ce94432eSBarry Smith   if (idxm >= bA->nr) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",idxm,bA->nr-1);
942ce94432eSBarry Smith   if (jdxm >= bA->nc) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %D max %D",jdxm,bA->nc-1);
943d8588912SDave May   *mat = bA->m[idxm][jdxm];
944d8588912SDave May   PetscFunctionReturn(0);
945d8588912SDave May }
946d8588912SDave May 
9479ba0d327SJed Brown /*@
948d8588912SDave May  MatNestGetSubMat - Returns a single, sub-matrix from a nest matrix.
949d8588912SDave May 
950d8588912SDave May  Not collective
951d8588912SDave May 
952d8588912SDave May  Input Parameters:
953629881c0SJed Brown +   A  - nest matrix
954d8588912SDave May .   idxm - index of the matrix within the nest matrix
955629881c0SJed Brown -   jdxm - index of the matrix within the nest matrix
956d8588912SDave May 
957d8588912SDave May  Output Parameter:
958d8588912SDave May .   sub - matrix at index idxm,jdxm within the nest matrix
959d8588912SDave May 
960d8588912SDave May  Level: developer
961d8588912SDave May 
962*79798668SBarry Smith .seealso: MatNestGetSize(), MatNestGetSubMats(), MatNestCreate(), MATNEST, MatNestSetSubMat(),
963*79798668SBarry Smith           MatNestGetLocalISs(), MatNestGetISs()
964d8588912SDave May @*/
9657087cfbeSBarry Smith PetscErrorCode  MatNestGetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat *sub)
966d8588912SDave May {
967699a902aSJed Brown   PetscErrorCode ierr;
968d8588912SDave May 
969d8588912SDave May   PetscFunctionBegin;
970699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSubMat_C",(Mat,PetscInt,PetscInt,Mat*),(A,idxm,jdxm,sub));CHKERRQ(ierr);
971d8588912SDave May   PetscFunctionReturn(0);
972d8588912SDave May }
973d8588912SDave May 
9740782ca92SJed Brown PetscErrorCode MatNestSetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat mat)
9750782ca92SJed Brown {
9760782ca92SJed Brown   Mat_Nest       *bA = (Mat_Nest*)A->data;
9770782ca92SJed Brown   PetscInt       m,n,M,N,mi,ni,Mi,Ni;
9780782ca92SJed Brown   PetscErrorCode ierr;
9790782ca92SJed Brown 
9800782ca92SJed Brown   PetscFunctionBegin;
981ce94432eSBarry Smith   if (idxm >= bA->nr) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",idxm,bA->nr-1);
982ce94432eSBarry Smith   if (jdxm >= bA->nc) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %D max %D",jdxm,bA->nc-1);
9830782ca92SJed Brown   ierr = MatGetLocalSize(mat,&m,&n);CHKERRQ(ierr);
9840782ca92SJed Brown   ierr = MatGetSize(mat,&M,&N);CHKERRQ(ierr);
9850782ca92SJed Brown   ierr = ISGetLocalSize(bA->isglobal.row[idxm],&mi);CHKERRQ(ierr);
9860782ca92SJed Brown   ierr = ISGetSize(bA->isglobal.row[idxm],&Mi);CHKERRQ(ierr);
9870782ca92SJed Brown   ierr = ISGetLocalSize(bA->isglobal.col[jdxm],&ni);CHKERRQ(ierr);
9880782ca92SJed Brown   ierr = ISGetSize(bA->isglobal.col[jdxm],&Ni);CHKERRQ(ierr);
989ce94432eSBarry Smith   if (M != Mi || N != Ni) SETERRQ4(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix dimension (%D,%D) incompatible with nest block (%D,%D)",M,N,Mi,Ni);
990ce94432eSBarry Smith   if (m != mi || n != ni) SETERRQ4(PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix local dimension (%D,%D) incompatible with nest block (%D,%D)",m,n,mi,ni);
99126fbe8dcSKarl Rupp 
9920782ca92SJed Brown   ierr = PetscObjectReference((PetscObject)mat);CHKERRQ(ierr);
9930782ca92SJed Brown   ierr = MatDestroy(&bA->m[idxm][jdxm]);CHKERRQ(ierr);
9940782ca92SJed Brown   bA->m[idxm][jdxm] = mat;
9950782ca92SJed Brown   PetscFunctionReturn(0);
9960782ca92SJed Brown }
9970782ca92SJed Brown 
9989ba0d327SJed Brown /*@
9990782ca92SJed Brown  MatNestSetSubMat - Set a single submatrix in the nest matrix.
10000782ca92SJed Brown 
10010782ca92SJed Brown  Logically collective on the submatrix communicator
10020782ca92SJed Brown 
10030782ca92SJed Brown  Input Parameters:
10040782ca92SJed Brown +   A  - nest matrix
10050782ca92SJed Brown .   idxm - index of the matrix within the nest matrix
10060782ca92SJed Brown .   jdxm - index of the matrix within the nest matrix
10070782ca92SJed Brown -   sub - matrix at index idxm,jdxm within the nest matrix
10080782ca92SJed Brown 
10090782ca92SJed Brown  Notes:
10100782ca92SJed Brown  The new submatrix must have the same size and communicator as that block of the nest.
10110782ca92SJed Brown 
10120782ca92SJed Brown  This increments the reference count of the submatrix.
10130782ca92SJed Brown 
10140782ca92SJed Brown  Level: developer
10150782ca92SJed Brown 
1016*79798668SBarry Smith .seealso: MatNestSetSubMats(), MatNestGetSubMats(), MatNestGetLocalISs(), MATNEST, MatNestCreate(),
1017*79798668SBarry Smith           MatNestGetSubMat(), MatNestGetISs(), MatNestGetSize()
10180782ca92SJed Brown @*/
10190782ca92SJed Brown PetscErrorCode  MatNestSetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat sub)
10200782ca92SJed Brown {
10210782ca92SJed Brown   PetscErrorCode ierr;
10220782ca92SJed Brown 
10230782ca92SJed Brown   PetscFunctionBegin;
10240782ca92SJed Brown   ierr = PetscUseMethod(A,"MatNestSetSubMat_C",(Mat,PetscInt,PetscInt,Mat),(A,idxm,jdxm,sub));CHKERRQ(ierr);
10250782ca92SJed Brown   PetscFunctionReturn(0);
10260782ca92SJed Brown }
10270782ca92SJed Brown 
1028d8588912SDave May PetscErrorCode MatNestGetSubMats_Nest(Mat A,PetscInt *M,PetscInt *N,Mat ***mat)
1029d8588912SDave May {
1030d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
10315fd66863SKarl Rupp 
1032d8588912SDave May   PetscFunctionBegin;
103326fbe8dcSKarl Rupp   if (M)   *M   = bA->nr;
103426fbe8dcSKarl Rupp   if (N)   *N   = bA->nc;
103526fbe8dcSKarl Rupp   if (mat) *mat = bA->m;
1036d8588912SDave May   PetscFunctionReturn(0);
1037d8588912SDave May }
1038d8588912SDave May 
1039d8588912SDave May /*@C
1040d8588912SDave May  MatNestGetSubMats - Returns the entire two dimensional array of matrices defining a nest matrix.
1041d8588912SDave May 
1042d8588912SDave May  Not collective
1043d8588912SDave May 
1044d8588912SDave May  Input Parameters:
1045629881c0SJed Brown .   A  - nest matrix
1046d8588912SDave May 
1047d8588912SDave May  Output Parameter:
1048629881c0SJed Brown +   M - number of rows in the nest matrix
1049d8588912SDave May .   N - number of cols in the nest matrix
1050629881c0SJed Brown -   mat - 2d array of matrices
1051d8588912SDave May 
1052d8588912SDave May  Notes:
1053d8588912SDave May 
1054d8588912SDave May  The user should not free the array mat.
1055d8588912SDave May 
1056351962e3SVincent Le Chenadec  In Fortran, this routine has a calling sequence
1057351962e3SVincent Le Chenadec $   call MatNestGetSubMats(A, M, N, mat, ierr)
1058351962e3SVincent Le Chenadec  where the space allocated for the optional argument mat is assumed large enough (if provided).
1059351962e3SVincent Le Chenadec 
1060d8588912SDave May  Level: developer
1061d8588912SDave May 
1062*79798668SBarry Smith .seealso: MatNestGetSize(), MatNestGetSubMat(), MatNestGetLocalISs(), MATNEST, MatNestCreate(),
1063*79798668SBarry Smith           MatNestSetSubMats(), MatNestGetISs(), MatNestSetSubMat()
1064d8588912SDave May @*/
10657087cfbeSBarry Smith PetscErrorCode  MatNestGetSubMats(Mat A,PetscInt *M,PetscInt *N,Mat ***mat)
1066d8588912SDave May {
1067699a902aSJed Brown   PetscErrorCode ierr;
1068d8588912SDave May 
1069d8588912SDave May   PetscFunctionBegin;
1070699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSubMats_C",(Mat,PetscInt*,PetscInt*,Mat***),(A,M,N,mat));CHKERRQ(ierr);
1071d8588912SDave May   PetscFunctionReturn(0);
1072d8588912SDave May }
1073d8588912SDave May 
10747087cfbeSBarry Smith PetscErrorCode  MatNestGetSize_Nest(Mat A,PetscInt *M,PetscInt *N)
1075d8588912SDave May {
1076d8588912SDave May   Mat_Nest *bA = (Mat_Nest*)A->data;
1077d8588912SDave May 
1078d8588912SDave May   PetscFunctionBegin;
107926fbe8dcSKarl Rupp   if (M) *M = bA->nr;
108026fbe8dcSKarl Rupp   if (N) *N = bA->nc;
1081d8588912SDave May   PetscFunctionReturn(0);
1082d8588912SDave May }
1083d8588912SDave May 
10849ba0d327SJed Brown /*@
1085d8588912SDave May  MatNestGetSize - Returns the size of the nest matrix.
1086d8588912SDave May 
1087d8588912SDave May  Not collective
1088d8588912SDave May 
1089d8588912SDave May  Input Parameters:
1090d8588912SDave May .   A  - nest matrix
1091d8588912SDave May 
1092d8588912SDave May  Output Parameter:
1093629881c0SJed Brown +   M - number of rows in the nested mat
1094629881c0SJed Brown -   N - number of cols in the nested mat
1095d8588912SDave May 
1096d8588912SDave May  Notes:
1097d8588912SDave May 
1098d8588912SDave May  Level: developer
1099d8588912SDave May 
1100*79798668SBarry Smith .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MATNEST, MatNestCreate(), MatNestGetLocalISs(),
1101*79798668SBarry Smith           MatNestGetISs()
1102d8588912SDave May @*/
11037087cfbeSBarry Smith PetscErrorCode  MatNestGetSize(Mat A,PetscInt *M,PetscInt *N)
1104d8588912SDave May {
1105699a902aSJed Brown   PetscErrorCode ierr;
1106d8588912SDave May 
1107d8588912SDave May   PetscFunctionBegin;
1108699a902aSJed Brown   ierr = PetscUseMethod(A,"MatNestGetSize_C",(Mat,PetscInt*,PetscInt*),(A,M,N));CHKERRQ(ierr);
1109d8588912SDave May   PetscFunctionReturn(0);
1110d8588912SDave May }
1111d8588912SDave May 
1112f7a08781SBarry Smith static PetscErrorCode MatNestGetISs_Nest(Mat A,IS rows[],IS cols[])
1113900e7ff2SJed Brown {
1114900e7ff2SJed Brown   Mat_Nest *vs = (Mat_Nest*)A->data;
1115900e7ff2SJed Brown   PetscInt i;
1116900e7ff2SJed Brown 
1117900e7ff2SJed Brown   PetscFunctionBegin;
1118900e7ff2SJed Brown   if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->isglobal.row[i];
1119900e7ff2SJed Brown   if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->isglobal.col[i];
1120900e7ff2SJed Brown   PetscFunctionReturn(0);
1121900e7ff2SJed Brown }
1122900e7ff2SJed Brown 
11233a4d7b9aSSatish Balay /*@C
1124900e7ff2SJed Brown  MatNestGetISs - Returns the index sets partitioning the row and column spaces
1125900e7ff2SJed Brown 
1126900e7ff2SJed Brown  Not collective
1127900e7ff2SJed Brown 
1128900e7ff2SJed Brown  Input Parameters:
1129900e7ff2SJed Brown .   A  - nest matrix
1130900e7ff2SJed Brown 
1131900e7ff2SJed Brown  Output Parameter:
1132900e7ff2SJed Brown +   rows - array of row index sets
1133900e7ff2SJed Brown -   cols - array of column index sets
1134900e7ff2SJed Brown 
1135900e7ff2SJed Brown  Level: advanced
1136900e7ff2SJed Brown 
1137900e7ff2SJed Brown  Notes:
1138900e7ff2SJed Brown  The user must have allocated arrays of the correct size. The reference count is not increased on the returned ISs.
1139900e7ff2SJed Brown 
1140*79798668SBarry Smith .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetLocalISs(), MATNEST,
1141*79798668SBarry Smith           MatNestCreate(), MatNestGetSubMats(), MatNestSetSubMats()
1142900e7ff2SJed Brown @*/
1143900e7ff2SJed Brown PetscErrorCode  MatNestGetISs(Mat A,IS rows[],IS cols[])
1144900e7ff2SJed Brown {
1145900e7ff2SJed Brown   PetscErrorCode ierr;
1146900e7ff2SJed Brown 
1147900e7ff2SJed Brown   PetscFunctionBegin;
1148900e7ff2SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1149900e7ff2SJed Brown   ierr = PetscUseMethod(A,"MatNestGetISs_C",(Mat,IS[],IS[]),(A,rows,cols));CHKERRQ(ierr);
1150900e7ff2SJed Brown   PetscFunctionReturn(0);
1151900e7ff2SJed Brown }
1152900e7ff2SJed Brown 
1153f7a08781SBarry Smith static PetscErrorCode MatNestGetLocalISs_Nest(Mat A,IS rows[],IS cols[])
1154900e7ff2SJed Brown {
1155900e7ff2SJed Brown   Mat_Nest *vs = (Mat_Nest*)A->data;
1156900e7ff2SJed Brown   PetscInt i;
1157900e7ff2SJed Brown 
1158900e7ff2SJed Brown   PetscFunctionBegin;
1159900e7ff2SJed Brown   if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->islocal.row[i];
1160900e7ff2SJed Brown   if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->islocal.col[i];
1161900e7ff2SJed Brown   PetscFunctionReturn(0);
1162900e7ff2SJed Brown }
1163900e7ff2SJed Brown 
1164900e7ff2SJed Brown /*@C
1165900e7ff2SJed Brown  MatNestGetLocalISs - Returns the index sets partitioning the row and column spaces
1166900e7ff2SJed Brown 
1167900e7ff2SJed Brown  Not collective
1168900e7ff2SJed Brown 
1169900e7ff2SJed Brown  Input Parameters:
1170900e7ff2SJed Brown .   A  - nest matrix
1171900e7ff2SJed Brown 
1172900e7ff2SJed Brown  Output Parameter:
11730298fd71SBarry Smith +   rows - array of row index sets (or NULL to ignore)
11740298fd71SBarry Smith -   cols - array of column index sets (or NULL to ignore)
1175900e7ff2SJed Brown 
1176900e7ff2SJed Brown  Level: advanced
1177900e7ff2SJed Brown 
1178900e7ff2SJed Brown  Notes:
1179900e7ff2SJed Brown  The user must have allocated arrays of the correct size. The reference count is not increased on the returned ISs.
1180900e7ff2SJed Brown 
1181*79798668SBarry Smith .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetISs(), MatNestCreate(),
1182*79798668SBarry Smith           MATNEST, MatNestSetSubMats(), MatNestSetSubMat()
1183900e7ff2SJed Brown @*/
1184900e7ff2SJed Brown PetscErrorCode  MatNestGetLocalISs(Mat A,IS rows[],IS cols[])
1185900e7ff2SJed Brown {
1186900e7ff2SJed Brown   PetscErrorCode ierr;
1187900e7ff2SJed Brown 
1188900e7ff2SJed Brown   PetscFunctionBegin;
1189900e7ff2SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1190900e7ff2SJed Brown   ierr = PetscUseMethod(A,"MatNestGetLocalISs_C",(Mat,IS[],IS[]),(A,rows,cols));CHKERRQ(ierr);
1191900e7ff2SJed Brown   PetscFunctionReturn(0);
1192900e7ff2SJed Brown }
1193900e7ff2SJed Brown 
119419fd82e9SBarry Smith PetscErrorCode  MatNestSetVecType_Nest(Mat A,VecType vtype)
1195207556f9SJed Brown {
1196207556f9SJed Brown   PetscErrorCode ierr;
1197207556f9SJed Brown   PetscBool      flg;
1198207556f9SJed Brown 
1199207556f9SJed Brown   PetscFunctionBegin;
1200207556f9SJed Brown   ierr = PetscStrcmp(vtype,VECNEST,&flg);CHKERRQ(ierr);
1201207556f9SJed Brown   /* In reality, this only distinguishes VECNEST and "other" */
12022a7a6963SBarry Smith   if (flg) A->ops->getvecs = MatCreateVecs_Nest;
120312b53f24SSatish Balay   else A->ops->getvecs = (PetscErrorCode (*)(Mat,Vec*,Vec*)) 0;
1204207556f9SJed Brown   PetscFunctionReturn(0);
1205207556f9SJed Brown }
1206207556f9SJed Brown 
1207207556f9SJed Brown /*@C
12082a7a6963SBarry Smith  MatNestSetVecType - Sets the type of Vec returned by MatCreateVecs()
1209207556f9SJed Brown 
1210207556f9SJed Brown  Not collective
1211207556f9SJed Brown 
1212207556f9SJed Brown  Input Parameters:
1213207556f9SJed Brown +  A  - nest matrix
1214207556f9SJed Brown -  vtype - type to use for creating vectors
1215207556f9SJed Brown 
1216207556f9SJed Brown  Notes:
1217207556f9SJed Brown 
1218207556f9SJed Brown  Level: developer
1219207556f9SJed Brown 
1220*79798668SBarry Smith .seealso: MatCreateVecs(), MATNEST, MatNestCreate()
1221207556f9SJed Brown @*/
122219fd82e9SBarry Smith PetscErrorCode  MatNestSetVecType(Mat A,VecType vtype)
1223207556f9SJed Brown {
1224207556f9SJed Brown   PetscErrorCode ierr;
1225207556f9SJed Brown 
1226207556f9SJed Brown   PetscFunctionBegin;
122719fd82e9SBarry Smith   ierr = PetscTryMethod(A,"MatNestSetVecType_C",(Mat,VecType),(A,vtype));CHKERRQ(ierr);
1228207556f9SJed Brown   PetscFunctionReturn(0);
1229207556f9SJed Brown }
1230207556f9SJed Brown 
1231c8883902SJed Brown PetscErrorCode MatNestSetSubMats_Nest(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[])
1232d8588912SDave May {
1233c8883902SJed Brown   Mat_Nest       *s = (Mat_Nest*)A->data;
1234c8883902SJed Brown   PetscInt       i,j,m,n,M,N;
1235d8588912SDave May   PetscErrorCode ierr;
1236d8588912SDave May 
1237d8588912SDave May   PetscFunctionBegin;
1238c8883902SJed Brown   s->nr = nr;
1239c8883902SJed Brown   s->nc = nc;
1240d8588912SDave May 
1241c8883902SJed Brown   /* Create space for submatrices */
1242854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&s->m);CHKERRQ(ierr);
1243c8883902SJed Brown   for (i=0; i<nr; i++) {
1244854ce69bSBarry Smith     ierr = PetscMalloc1(nc,&s->m[i]);CHKERRQ(ierr);
1245d8588912SDave May   }
1246c8883902SJed Brown   for (i=0; i<nr; i++) {
1247c8883902SJed Brown     for (j=0; j<nc; j++) {
1248c8883902SJed Brown       s->m[i][j] = a[i*nc+j];
1249c8883902SJed Brown       if (a[i*nc+j]) {
1250c8883902SJed Brown         ierr = PetscObjectReference((PetscObject)a[i*nc+j]);CHKERRQ(ierr);
1251d8588912SDave May       }
1252d8588912SDave May     }
1253d8588912SDave May   }
1254d8588912SDave May 
12558188e55aSJed Brown   ierr = MatSetUp_NestIS_Private(A,nr,is_row,nc,is_col);CHKERRQ(ierr);
1256d8588912SDave May 
1257854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&s->row_len);CHKERRQ(ierr);
1258854ce69bSBarry Smith   ierr = PetscMalloc1(nc,&s->col_len);CHKERRQ(ierr);
1259c8883902SJed Brown   for (i=0; i<nr; i++) s->row_len[i]=-1;
1260c8883902SJed Brown   for (j=0; j<nc; j++) s->col_len[j]=-1;
1261d8588912SDave May 
12628188e55aSJed Brown   ierr = MatNestGetSizes_Private(A,&m,&n,&M,&N);CHKERRQ(ierr);
1263d8588912SDave May 
1264c8883902SJed Brown   ierr = PetscLayoutSetSize(A->rmap,M);CHKERRQ(ierr);
1265c8883902SJed Brown   ierr = PetscLayoutSetLocalSize(A->rmap,m);CHKERRQ(ierr);
1266c8883902SJed Brown   ierr = PetscLayoutSetSize(A->cmap,N);CHKERRQ(ierr);
1267c8883902SJed Brown   ierr = PetscLayoutSetLocalSize(A->cmap,n);CHKERRQ(ierr);
1268c8883902SJed Brown 
1269c8883902SJed Brown   ierr = PetscLayoutSetUp(A->rmap);CHKERRQ(ierr);
1270c8883902SJed Brown   ierr = PetscLayoutSetUp(A->cmap);CHKERRQ(ierr);
1271c8883902SJed Brown 
12721795a4d1SJed Brown   ierr = PetscCalloc2(nr,&s->left,nc,&s->right);CHKERRQ(ierr);
1273d8588912SDave May   PetscFunctionReturn(0);
1274d8588912SDave May }
1275d8588912SDave May 
1276c8883902SJed Brown /*@
1277c8883902SJed Brown    MatNestSetSubMats - Sets the nested submatrices
1278c8883902SJed Brown 
1279c8883902SJed Brown    Collective on Mat
1280c8883902SJed Brown 
1281c8883902SJed Brown    Input Parameter:
1282ffd6319bSRichard Tran Mills +  A - nested matrix
1283c8883902SJed Brown .  nr - number of nested row blocks
12840298fd71SBarry Smith .  is_row - index sets for each nested row block, or NULL to make contiguous
1285c8883902SJed Brown .  nc - number of nested column blocks
12860298fd71SBarry Smith .  is_col - index sets for each nested column block, or NULL to make contiguous
12870298fd71SBarry Smith -  a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL
1288c8883902SJed Brown 
1289c8883902SJed Brown    Level: advanced
1290c8883902SJed Brown 
1291*79798668SBarry Smith .seealso: MatCreateNest(), MATNEST, MatNestSetSubMat(), MatNestGetSubMat(), MatNestGetSubMats()
1292c8883902SJed Brown @*/
1293c8883902SJed Brown PetscErrorCode MatNestSetSubMats(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[])
1294c8883902SJed Brown {
1295c8883902SJed Brown   PetscErrorCode ierr;
1296eb6c2100SSatish Balay   PetscInt       i,nr_nc;
1297c8883902SJed Brown 
1298c8883902SJed Brown   PetscFunctionBegin;
1299c8883902SJed Brown   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
1300ce94432eSBarry Smith   if (nr < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of rows cannot be negative");
1301c8883902SJed Brown   if (nr && is_row) {
1302c8883902SJed Brown     PetscValidPointer(is_row,3);
1303c8883902SJed Brown     for (i=0; i<nr; i++) PetscValidHeaderSpecific(is_row[i],IS_CLASSID,3);
1304c8883902SJed Brown   }
1305ce94432eSBarry Smith   if (nc < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of columns cannot be negative");
13061664e352SJed Brown   if (nc && is_col) {
1307c8883902SJed Brown     PetscValidPointer(is_col,5);
13089b30a8f6SBarry Smith     for (i=0; i<nc; i++) PetscValidHeaderSpecific(is_col[i],IS_CLASSID,5);
1309c8883902SJed Brown   }
1310eb6c2100SSatish Balay   nr_nc=nr*nc;
1311eb6c2100SSatish Balay   if (nr_nc) PetscValidPointer(a,6);
1312c8883902SJed Brown   ierr = PetscUseMethod(A,"MatNestSetSubMats_C",(Mat,PetscInt,const IS[],PetscInt,const IS[],const Mat[]),(A,nr,is_row,nc,is_col,a));CHKERRQ(ierr);
1313c8883902SJed Brown   PetscFunctionReturn(0);
1314c8883902SJed Brown }
1315d8588912SDave May 
131645b6f7e9SBarry Smith static PetscErrorCode MatNestCreateAggregateL2G_Private(Mat A,PetscInt n,const IS islocal[],const IS isglobal[],PetscBool colflg,ISLocalToGlobalMapping *ltog)
131777019fcaSJed Brown {
131877019fcaSJed Brown   PetscErrorCode ierr;
131977019fcaSJed Brown   PetscBool      flg;
132077019fcaSJed Brown   PetscInt       i,j,m,mi,*ix;
132177019fcaSJed Brown 
132277019fcaSJed Brown   PetscFunctionBegin;
132377019fcaSJed Brown   for (i=0,m=0,flg=PETSC_FALSE; i<n; i++) {
132477019fcaSJed Brown     if (islocal[i]) {
132577019fcaSJed Brown       ierr = ISGetSize(islocal[i],&mi);CHKERRQ(ierr);
132677019fcaSJed Brown       flg  = PETSC_TRUE;      /* We found a non-trivial entry */
132777019fcaSJed Brown     } else {
132877019fcaSJed Brown       ierr = ISGetSize(isglobal[i],&mi);CHKERRQ(ierr);
132977019fcaSJed Brown     }
133077019fcaSJed Brown     m += mi;
133177019fcaSJed Brown   }
133277019fcaSJed Brown   if (flg) {
1333785e854fSJed Brown     ierr = PetscMalloc1(m,&ix);CHKERRQ(ierr);
1334165cd838SBarry Smith     for (i=0,m=0; i<n; i++) {
13350298fd71SBarry Smith       ISLocalToGlobalMapping smap = NULL;
1336e108cb99SStefano Zampini       Mat                    sub = NULL;
1337f6d38dbbSStefano Zampini       PetscSF                sf;
1338f6d38dbbSStefano Zampini       PetscLayout            map;
1339f6d38dbbSStefano Zampini       PetscInt               *ix2;
134077019fcaSJed Brown 
1341165cd838SBarry Smith       if (!colflg) {
134277019fcaSJed Brown         ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
134377019fcaSJed Brown       } else {
134477019fcaSJed Brown         ierr = MatNestFindNonzeroSubMatCol(A,i,&sub);CHKERRQ(ierr);
134577019fcaSJed Brown       }
1346191fd14bSBarry Smith       if (sub) {
1347191fd14bSBarry Smith         if (!colflg) {
1348191fd14bSBarry Smith           ierr = MatGetLocalToGlobalMapping(sub,&smap,NULL);CHKERRQ(ierr);
1349191fd14bSBarry Smith         } else {
1350191fd14bSBarry Smith           ierr = MatGetLocalToGlobalMapping(sub,NULL,&smap);CHKERRQ(ierr);
1351191fd14bSBarry Smith         }
1352191fd14bSBarry Smith       }
135377019fcaSJed Brown       if (islocal[i]) {
135477019fcaSJed Brown         ierr = ISGetSize(islocal[i],&mi);CHKERRQ(ierr);
135577019fcaSJed Brown       } else {
135677019fcaSJed Brown         ierr = ISGetSize(isglobal[i],&mi);CHKERRQ(ierr);
135777019fcaSJed Brown       }
135877019fcaSJed Brown       for (j=0; j<mi; j++) ix[m+j] = j;
135977019fcaSJed Brown       if (smap) {ierr = ISLocalToGlobalMappingApply(smap,mi,ix+m,ix+m);CHKERRQ(ierr);}
1360165cd838SBarry Smith 
136177019fcaSJed Brown       /*
136277019fcaSJed Brown         Now we need to extract the monolithic global indices that correspond to the given split global indices.
136377019fcaSJed Brown         In many/most cases, we only want MatGetLocalSubMatrix() to work, in which case we only need to know the size of the local spaces.
136477019fcaSJed Brown        */
1365f6d38dbbSStefano Zampini       ierr = PetscMalloc1(mi,&ix2);CHKERRQ(ierr);
1366f6d38dbbSStefano Zampini       ierr = PetscSFCreate(((PetscObject)isglobal[i])->comm,&sf);CHKERRQ(ierr);
1367f6d38dbbSStefano Zampini       ierr = PetscLayoutCreate(((PetscObject)isglobal[i])->comm,&map);CHKERRQ(ierr);
1368f6d38dbbSStefano Zampini       ierr = PetscLayoutSetLocalSize(map,mi);CHKERRQ(ierr);
1369f6d38dbbSStefano Zampini       ierr = PetscLayoutSetUp(map);CHKERRQ(ierr);
1370f6d38dbbSStefano Zampini       ierr = PetscSFSetGraphLayout(sf,map,mi,NULL,PETSC_USE_POINTER,ix+m);CHKERRQ(ierr);
1371f6d38dbbSStefano Zampini       ierr = PetscLayoutDestroy(&map);CHKERRQ(ierr);
1372f6d38dbbSStefano Zampini       for (j=0; j<mi; j++) ix2[j] = ix[m+j];
1373f6d38dbbSStefano Zampini       ierr = PetscSFBcastBegin(sf,MPIU_INT,ix2,ix + m);CHKERRQ(ierr);
1374f6d38dbbSStefano Zampini       ierr = PetscSFBcastEnd(sf,MPIU_INT,ix2,ix + m);CHKERRQ(ierr);
1375f6d38dbbSStefano Zampini       ierr = PetscSFDestroy(&sf);CHKERRQ(ierr);
1376f6d38dbbSStefano Zampini       ierr = PetscFree(ix2);CHKERRQ(ierr);
137777019fcaSJed Brown       m   += mi;
137877019fcaSJed Brown     }
1379f0413b6fSBarry Smith     ierr = ISLocalToGlobalMappingCreate(PetscObjectComm((PetscObject)A),1,m,ix,PETSC_OWN_POINTER,ltog);CHKERRQ(ierr);
138077019fcaSJed Brown   } else {
13810298fd71SBarry Smith     *ltog = NULL;
138277019fcaSJed Brown   }
138377019fcaSJed Brown   PetscFunctionReturn(0);
138477019fcaSJed Brown }
138577019fcaSJed Brown 
138677019fcaSJed Brown 
/* If an IS was provided, there is nothing Nest needs to do, otherwise Nest will build a strided IS */
/*
  nprocessors = NP
  Nest x^T = ((g_0,g_1,...,g_NP-1), (h_0,h_1,...,h_NP-1))
       proc 0:    => (g_0,h_0)
       proc 1:    => (g_1,h_1)
       ...
       proc NP-1: => (g_NP-1,h_NP-1)

  Each process numbers its blocks contiguously, starting after everything owned by lower ranks:
    off(p) = sum over q < p of (nlocal(g_q) + nlocal(h_q)),   so off(0) = 0

            proc p:
    is[0] = (off(p), off(p)+1, ..., off(p)+nlocal(g_p)-1)

            proc p:
    is[1] = (off(p)+nlocal(g_p), off(p)+nlocal(g_p)+1, ..., off(p)+nlocal(g_p)+nlocal(h_p)-1)

  For example, on proc 0:
    is[0] = (0,1,2,...,nlocal(g_0)-1)
    is[1] = (nlocal(g_0),nlocal(g_0)+1,...,nlocal(g_0)+nlocal(h_0)-1)
*/
1407841e96a3SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[])
1408d8588912SDave May {
1409e2d7f03fSJed Brown   Mat_Nest       *vs = (Mat_Nest*)A->data;
14108188e55aSJed Brown   PetscInt       i,j,offset,n,nsum,bs;
1411d8588912SDave May   PetscErrorCode ierr;
14120298fd71SBarry Smith   Mat            sub = NULL;
1413d8588912SDave May 
1414d8588912SDave May   PetscFunctionBegin;
1415854ce69bSBarry Smith   ierr = PetscMalloc1(nr,&vs->isglobal.row);CHKERRQ(ierr);
1416854ce69bSBarry Smith   ierr = PetscMalloc1(nc,&vs->isglobal.col);CHKERRQ(ierr);
1417d8588912SDave May   if (is_row) { /* valid IS is passed in */
1418d8588912SDave May     /* refs on is[] are incremeneted */
1419e2d7f03fSJed Brown     for (i=0; i<vs->nr; i++) {
1420d8588912SDave May       ierr = PetscObjectReference((PetscObject)is_row[i]);CHKERRQ(ierr);
142126fbe8dcSKarl Rupp 
1422e2d7f03fSJed Brown       vs->isglobal.row[i] = is_row[i];
1423d8588912SDave May     }
14242ae74bdbSJed Brown   } else {                      /* Create the ISs by inspecting sizes of a submatrix in each row */
14258188e55aSJed Brown     nsum = 0;
14268188e55aSJed Brown     for (i=0; i<vs->nr; i++) {  /* Add up the local sizes to compute the aggregate offset */
14278188e55aSJed Brown       ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
1428ce94432eSBarry Smith       if (!sub) SETERRQ1(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in row %D",i);
14290298fd71SBarry Smith       ierr = MatGetLocalSize(sub,&n,NULL);CHKERRQ(ierr);
1430ce94432eSBarry Smith       if (n < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix");
14318188e55aSJed Brown       nsum += n;
14328188e55aSJed Brown     }
1433ce94432eSBarry Smith     ierr    = MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A));CHKERRQ(ierr);
143430bc264bSJed Brown     offset -= nsum;
1435e2d7f03fSJed Brown     for (i=0; i<vs->nr; i++) {
1436f349c1fdSJed Brown       ierr    = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
14370298fd71SBarry Smith       ierr    = MatGetLocalSize(sub,&n,NULL);CHKERRQ(ierr);
14382ae74bdbSJed Brown       ierr    = MatGetBlockSize(sub,&bs);CHKERRQ(ierr);
1439ce94432eSBarry Smith       ierr    = ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.row[i]);CHKERRQ(ierr);
1440e2d7f03fSJed Brown       ierr    = ISSetBlockSize(vs->isglobal.row[i],bs);CHKERRQ(ierr);
14412ae74bdbSJed Brown       offset += n;
1442d8588912SDave May     }
1443d8588912SDave May   }
1444d8588912SDave May 
1445d8588912SDave May   if (is_col) { /* valid IS is passed in */
1446d8588912SDave May     /* refs on is[] are incremeneted */
1447e2d7f03fSJed Brown     for (j=0; j<vs->nc; j++) {
1448d8588912SDave May       ierr = PetscObjectReference((PetscObject)is_col[j]);CHKERRQ(ierr);
144926fbe8dcSKarl Rupp 
1450e2d7f03fSJed Brown       vs->isglobal.col[j] = is_col[j];
1451d8588912SDave May     }
14522ae74bdbSJed Brown   } else {                      /* Create the ISs by inspecting sizes of a submatrix in each column */
14532ae74bdbSJed Brown     offset = A->cmap->rstart;
14548188e55aSJed Brown     nsum   = 0;
14558188e55aSJed Brown     for (j=0; j<vs->nc; j++) {
14568188e55aSJed Brown       ierr = MatNestFindNonzeroSubMatCol(A,j,&sub);CHKERRQ(ierr);
1457ce94432eSBarry Smith       if (!sub) SETERRQ1(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in column %D",i);
14580298fd71SBarry Smith       ierr = MatGetLocalSize(sub,NULL,&n);CHKERRQ(ierr);
1459ce94432eSBarry Smith       if (n < 0) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix");
14608188e55aSJed Brown       nsum += n;
14618188e55aSJed Brown     }
1462ce94432eSBarry Smith     ierr    = MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A));CHKERRQ(ierr);
146330bc264bSJed Brown     offset -= nsum;
1464e2d7f03fSJed Brown     for (j=0; j<vs->nc; j++) {
1465f349c1fdSJed Brown       ierr    = MatNestFindNonzeroSubMatCol(A,j,&sub);CHKERRQ(ierr);
14660298fd71SBarry Smith       ierr    = MatGetLocalSize(sub,NULL,&n);CHKERRQ(ierr);
14672ae74bdbSJed Brown       ierr    = MatGetBlockSize(sub,&bs);CHKERRQ(ierr);
1468ce94432eSBarry Smith       ierr    = ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.col[j]);CHKERRQ(ierr);
1469e2d7f03fSJed Brown       ierr    = ISSetBlockSize(vs->isglobal.col[j],bs);CHKERRQ(ierr);
14702ae74bdbSJed Brown       offset += n;
1471d8588912SDave May     }
1472d8588912SDave May   }
1473e2d7f03fSJed Brown 
1474e2d7f03fSJed Brown   /* Set up the local ISs */
1475785e854fSJed Brown   ierr = PetscMalloc1(vs->nr,&vs->islocal.row);CHKERRQ(ierr);
1476785e854fSJed Brown   ierr = PetscMalloc1(vs->nc,&vs->islocal.col);CHKERRQ(ierr);
1477e2d7f03fSJed Brown   for (i=0,offset=0; i<vs->nr; i++) {
1478e2d7f03fSJed Brown     IS                     isloc;
14790298fd71SBarry Smith     ISLocalToGlobalMapping rmap = NULL;
1480e2d7f03fSJed Brown     PetscInt               nlocal,bs;
1481e2d7f03fSJed Brown     ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr);
14820298fd71SBarry Smith     if (sub) {ierr = MatGetLocalToGlobalMapping(sub,&rmap,NULL);CHKERRQ(ierr);}
1483207556f9SJed Brown     if (rmap) {
1484e2d7f03fSJed Brown       ierr = MatGetBlockSize(sub,&bs);CHKERRQ(ierr);
1485e2d7f03fSJed Brown       ierr = ISLocalToGlobalMappingGetSize(rmap,&nlocal);CHKERRQ(ierr);
1486e2d7f03fSJed Brown       ierr = ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc);CHKERRQ(ierr);
1487e2d7f03fSJed Brown       ierr = ISSetBlockSize(isloc,bs);CHKERRQ(ierr);
1488207556f9SJed Brown     } else {
1489207556f9SJed Brown       nlocal = 0;
14900298fd71SBarry Smith       isloc  = NULL;
1491207556f9SJed Brown     }
1492e2d7f03fSJed Brown     vs->islocal.row[i] = isloc;
1493e2d7f03fSJed Brown     offset            += nlocal;
1494e2d7f03fSJed Brown   }
14958188e55aSJed Brown   for (i=0,offset=0; i<vs->nc; i++) {
1496e2d7f03fSJed Brown     IS                     isloc;
14970298fd71SBarry Smith     ISLocalToGlobalMapping cmap = NULL;
1498e2d7f03fSJed Brown     PetscInt               nlocal,bs;
1499e2d7f03fSJed Brown     ierr = MatNestFindNonzeroSubMatCol(A,i,&sub);CHKERRQ(ierr);
15000298fd71SBarry Smith     if (sub) {ierr = MatGetLocalToGlobalMapping(sub,NULL,&cmap);CHKERRQ(ierr);}
1501207556f9SJed Brown     if (cmap) {
1502e2d7f03fSJed Brown       ierr = MatGetBlockSize(sub,&bs);CHKERRQ(ierr);
1503e2d7f03fSJed Brown       ierr = ISLocalToGlobalMappingGetSize(cmap,&nlocal);CHKERRQ(ierr);
1504e2d7f03fSJed Brown       ierr = ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc);CHKERRQ(ierr);
1505e2d7f03fSJed Brown       ierr = ISSetBlockSize(isloc,bs);CHKERRQ(ierr);
1506207556f9SJed Brown     } else {
1507207556f9SJed Brown       nlocal = 0;
15080298fd71SBarry Smith       isloc  = NULL;
1509207556f9SJed Brown     }
1510e2d7f03fSJed Brown     vs->islocal.col[i] = isloc;
1511e2d7f03fSJed Brown     offset            += nlocal;
1512e2d7f03fSJed Brown   }
15130189643fSJed Brown 
151477019fcaSJed Brown   /* Set up the aggregate ISLocalToGlobalMapping */
151577019fcaSJed Brown   {
151645b6f7e9SBarry Smith     ISLocalToGlobalMapping rmap,cmap;
151745b6f7e9SBarry Smith     ierr = MatNestCreateAggregateL2G_Private(A,vs->nr,vs->islocal.row,vs->isglobal.row,PETSC_FALSE,&rmap);CHKERRQ(ierr);
151845b6f7e9SBarry Smith     ierr = MatNestCreateAggregateL2G_Private(A,vs->nc,vs->islocal.col,vs->isglobal.col,PETSC_TRUE,&cmap);CHKERRQ(ierr);
151977019fcaSJed Brown     if (rmap && cmap) {ierr = MatSetLocalToGlobalMapping(A,rmap,cmap);CHKERRQ(ierr);}
152077019fcaSJed Brown     ierr = ISLocalToGlobalMappingDestroy(&rmap);CHKERRQ(ierr);
152177019fcaSJed Brown     ierr = ISLocalToGlobalMappingDestroy(&cmap);CHKERRQ(ierr);
152277019fcaSJed Brown   }
152377019fcaSJed Brown 
15240189643fSJed Brown #if defined(PETSC_USE_DEBUG)
15250189643fSJed Brown   for (i=0; i<vs->nr; i++) {
15260189643fSJed Brown     for (j=0; j<vs->nc; j++) {
15270189643fSJed Brown       PetscInt m,n,M,N,mi,ni,Mi,Ni;
15280189643fSJed Brown       Mat      B = vs->m[i][j];
15290189643fSJed Brown       if (!B) continue;
15300189643fSJed Brown       ierr = MatGetSize(B,&M,&N);CHKERRQ(ierr);
15310189643fSJed Brown       ierr = MatGetLocalSize(B,&m,&n);CHKERRQ(ierr);
15320189643fSJed Brown       ierr = ISGetSize(vs->isglobal.row[i],&Mi);CHKERRQ(ierr);
15330189643fSJed Brown       ierr = ISGetSize(vs->isglobal.col[j],&Ni);CHKERRQ(ierr);
15340189643fSJed Brown       ierr = ISGetLocalSize(vs->isglobal.row[i],&mi);CHKERRQ(ierr);
15350189643fSJed Brown       ierr = ISGetLocalSize(vs->isglobal.col[j],&ni);CHKERRQ(ierr);
1536ce94432eSBarry Smith       if (M != Mi || N != Ni) SETERRQ6(PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Global sizes (%D,%D) of nested submatrix (%D,%D) do not agree with space defined by index sets (%D,%D)",M,N,i,j,Mi,Ni);
1537ce94432eSBarry Smith       if (m != mi || n != ni) SETERRQ6(PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Local sizes (%D,%D) of nested submatrix (%D,%D) do not agree with space defined by index sets (%D,%D)",m,n,i,j,mi,ni);
15380189643fSJed Brown     }
15390189643fSJed Brown   }
15400189643fSJed Brown #endif
1541a061e289SJed Brown 
1542a061e289SJed Brown   /* Set A->assembled if all non-null blocks are currently assembled */
1543a061e289SJed Brown   for (i=0; i<vs->nr; i++) {
1544a061e289SJed Brown     for (j=0; j<vs->nc; j++) {
1545a061e289SJed Brown       if (vs->m[i][j] && !vs->m[i][j]->assembled) PetscFunctionReturn(0);
1546a061e289SJed Brown     }
1547a061e289SJed Brown   }
1548a061e289SJed Brown   A->assembled = PETSC_TRUE;
1549d8588912SDave May   PetscFunctionReturn(0);
1550d8588912SDave May }
1551d8588912SDave May 
155245c38901SJed Brown /*@C
1553659c6bb0SJed Brown    MatCreateNest - Creates a new matrix containing several nested submatrices, each stored separately
1554659c6bb0SJed Brown 
1555659c6bb0SJed Brown    Collective on Mat
1556659c6bb0SJed Brown 
1557659c6bb0SJed Brown    Input Parameter:
1558659c6bb0SJed Brown +  comm - Communicator for the new Mat
1559659c6bb0SJed Brown .  nr - number of nested row blocks
15600298fd71SBarry Smith .  is_row - index sets for each nested row block, or NULL to make contiguous
1561659c6bb0SJed Brown .  nc - number of nested column blocks
15620298fd71SBarry Smith .  is_col - index sets for each nested column block, or NULL to make contiguous
15630298fd71SBarry Smith -  a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL
1564659c6bb0SJed Brown 
1565659c6bb0SJed Brown    Output Parameter:
1566659c6bb0SJed Brown .  B - new matrix
1567659c6bb0SJed Brown 
1568659c6bb0SJed Brown    Level: advanced
1569659c6bb0SJed Brown 
1570*79798668SBarry Smith .seealso: MatCreate(), VecCreateNest(), DMCreateMatrix(), MATNEST, MatNestSetSubMat(),
1571*79798668SBarry Smith           MatNestGetSubMat(), MatNestGetLocalISs(), MatNestGetSize(),
1572*79798668SBarry Smith           MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats()
1573659c6bb0SJed Brown @*/
15747087cfbeSBarry Smith PetscErrorCode MatCreateNest(MPI_Comm comm,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[],Mat *B)
1575d8588912SDave May {
1576d8588912SDave May   Mat            A;
1577d8588912SDave May   PetscErrorCode ierr;
1578d8588912SDave May 
1579d8588912SDave May   PetscFunctionBegin;
1580c8883902SJed Brown   *B   = 0;
1581d8588912SDave May   ierr = MatCreate(comm,&A);CHKERRQ(ierr);
1582c8883902SJed Brown   ierr = MatSetType(A,MATNEST);CHKERRQ(ierr);
158391a28eb3SBarry Smith   A->preallocated = PETSC_TRUE;
1584c8883902SJed Brown   ierr = MatNestSetSubMats(A,nr,is_row,nc,is_col,a);CHKERRQ(ierr);
1585d8588912SDave May   *B   = A;
1586d8588912SDave May   PetscFunctionReturn(0);
1587d8588912SDave May }
1588659c6bb0SJed Brown 
1589b68353e5Sstefano_zampini static PetscErrorCode MatConvert_Nest_SeqAIJ_fast(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
1590b68353e5Sstefano_zampini {
1591b68353e5Sstefano_zampini   Mat_Nest       *nest = (Mat_Nest*)A->data;
159223875855Sstefano_zampini   Mat            *trans;
1593b68353e5Sstefano_zampini   PetscScalar    **avv;
1594b68353e5Sstefano_zampini   PetscScalar    *vv;
1595b68353e5Sstefano_zampini   PetscInt       **aii,**ajj;
1596b68353e5Sstefano_zampini   PetscInt       *ii,*jj,*ci;
1597b68353e5Sstefano_zampini   PetscInt       nr,nc,nnz,i,j;
1598b68353e5Sstefano_zampini   PetscBool      done;
1599b68353e5Sstefano_zampini   PetscErrorCode ierr;
1600b68353e5Sstefano_zampini 
1601b68353e5Sstefano_zampini   PetscFunctionBegin;
1602b68353e5Sstefano_zampini   ierr = MatGetSize(A,&nr,&nc);CHKERRQ(ierr);
1603b68353e5Sstefano_zampini   if (reuse == MAT_REUSE_MATRIX) {
1604b68353e5Sstefano_zampini     PetscInt rnr;
1605b68353e5Sstefano_zampini 
1606b68353e5Sstefano_zampini     ierr = MatGetRowIJ(*newmat,0,PETSC_FALSE,PETSC_FALSE,&rnr,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr);
1607b68353e5Sstefano_zampini     if (!done) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"MatGetRowIJ");
1608b68353e5Sstefano_zampini     if (rnr != nr) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of rows");
1609b68353e5Sstefano_zampini     ierr = MatSeqAIJGetArray(*newmat,&vv);CHKERRQ(ierr);
1610b68353e5Sstefano_zampini   }
1611b68353e5Sstefano_zampini   /* extract CSR for nested SeqAIJ matrices */
1612b68353e5Sstefano_zampini   nnz  = 0;
161323875855Sstefano_zampini   ierr = PetscCalloc4(nest->nr*nest->nc,&aii,nest->nr*nest->nc,&ajj,nest->nr*nest->nc,&avv,nest->nr*nest->nc,&trans);CHKERRQ(ierr);
1614b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1615b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1616b68353e5Sstefano_zampini       Mat B = nest->m[i][j];
1617b68353e5Sstefano_zampini       if (B) {
1618b68353e5Sstefano_zampini         PetscScalar *naa;
1619b68353e5Sstefano_zampini         PetscInt    *nii,*njj,nnr;
162023875855Sstefano_zampini         PetscBool   istrans;
1621b68353e5Sstefano_zampini 
162223875855Sstefano_zampini         ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans);CHKERRQ(ierr);
162323875855Sstefano_zampini         if (istrans) {
162423875855Sstefano_zampini           Mat Bt;
162523875855Sstefano_zampini 
162623875855Sstefano_zampini           ierr = MatTransposeGetMat(B,&Bt);CHKERRQ(ierr);
162723875855Sstefano_zampini           ierr = MatTranspose(Bt,MAT_INITIAL_MATRIX,&trans[i*nest->nc+j]);CHKERRQ(ierr);
162823875855Sstefano_zampini           B    = trans[i*nest->nc+j];
162923875855Sstefano_zampini         }
1630b68353e5Sstefano_zampini         ierr = MatGetRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&nii,(const PetscInt**)&njj,&done);CHKERRQ(ierr);
1631b68353e5Sstefano_zampini         if (!done) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatGetRowIJ");
1632b68353e5Sstefano_zampini         ierr = MatSeqAIJGetArray(B,&naa);CHKERRQ(ierr);
1633b68353e5Sstefano_zampini         nnz += nii[nnr];
1634b68353e5Sstefano_zampini 
1635b68353e5Sstefano_zampini         aii[i*nest->nc+j] = nii;
1636b68353e5Sstefano_zampini         ajj[i*nest->nc+j] = njj;
1637b68353e5Sstefano_zampini         avv[i*nest->nc+j] = naa;
1638b68353e5Sstefano_zampini       }
1639b68353e5Sstefano_zampini     }
1640b68353e5Sstefano_zampini   }
1641b68353e5Sstefano_zampini   if (reuse != MAT_REUSE_MATRIX) {
1642b68353e5Sstefano_zampini     ierr = PetscMalloc1(nr+1,&ii);CHKERRQ(ierr);
1643b68353e5Sstefano_zampini     ierr = PetscMalloc1(nnz,&jj);CHKERRQ(ierr);
1644b68353e5Sstefano_zampini     ierr = PetscMalloc1(nnz,&vv);CHKERRQ(ierr);
1645b68353e5Sstefano_zampini   } else {
1646b68353e5Sstefano_zampini     if (nnz != ii[nr]) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of nonzeros");
1647b68353e5Sstefano_zampini   }
1648b68353e5Sstefano_zampini 
1649b68353e5Sstefano_zampini   /* new row pointer */
1650580bdb30SBarry Smith   ierr = PetscArrayzero(ii,nr+1);CHKERRQ(ierr);
1651b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1652b68353e5Sstefano_zampini     PetscInt       ncr,rst;
1653b68353e5Sstefano_zampini 
1654b68353e5Sstefano_zampini     ierr = ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL);CHKERRQ(ierr);
1655b68353e5Sstefano_zampini     ierr = ISGetLocalSize(nest->isglobal.row[i],&ncr);CHKERRQ(ierr);
1656b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1657b68353e5Sstefano_zampini       if (aii[i*nest->nc+j]) {
1658b68353e5Sstefano_zampini         PetscInt    *nii = aii[i*nest->nc+j];
1659b68353e5Sstefano_zampini         PetscInt    ir;
1660b68353e5Sstefano_zampini 
1661b68353e5Sstefano_zampini         for (ir=rst; ir<ncr+rst; ++ir) {
1662b68353e5Sstefano_zampini           ii[ir+1] += nii[1]-nii[0];
1663b68353e5Sstefano_zampini           nii++;
1664b68353e5Sstefano_zampini         }
1665b68353e5Sstefano_zampini       }
1666b68353e5Sstefano_zampini     }
1667b68353e5Sstefano_zampini   }
1668b68353e5Sstefano_zampini   for (i=0; i<nr; i++) ii[i+1] += ii[i];
1669b68353e5Sstefano_zampini 
1670b68353e5Sstefano_zampini   /* construct CSR for the new matrix */
1671b68353e5Sstefano_zampini   ierr = PetscCalloc1(nr,&ci);CHKERRQ(ierr);
1672b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1673b68353e5Sstefano_zampini     PetscInt       ncr,rst;
1674b68353e5Sstefano_zampini 
1675b68353e5Sstefano_zampini     ierr = ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL);CHKERRQ(ierr);
1676b68353e5Sstefano_zampini     ierr = ISGetLocalSize(nest->isglobal.row[i],&ncr);CHKERRQ(ierr);
1677b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1678b68353e5Sstefano_zampini       if (aii[i*nest->nc+j]) {
1679b68353e5Sstefano_zampini         PetscScalar *nvv = avv[i*nest->nc+j];
1680b68353e5Sstefano_zampini         PetscInt    *nii = aii[i*nest->nc+j];
1681b68353e5Sstefano_zampini         PetscInt    *njj = ajj[i*nest->nc+j];
1682b68353e5Sstefano_zampini         PetscInt    ir,cst;
1683b68353e5Sstefano_zampini 
1684b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.col[j],&cst,NULL);CHKERRQ(ierr);
1685b68353e5Sstefano_zampini         for (ir=rst; ir<ncr+rst; ++ir) {
1686b68353e5Sstefano_zampini           PetscInt ij,rsize = nii[1]-nii[0],ist = ii[ir]+ci[ir];
1687b68353e5Sstefano_zampini 
1688b68353e5Sstefano_zampini           for (ij=0;ij<rsize;ij++) {
1689b68353e5Sstefano_zampini             jj[ist+ij] = *njj+cst;
1690b68353e5Sstefano_zampini             vv[ist+ij] = *nvv;
1691b68353e5Sstefano_zampini             njj++;
1692b68353e5Sstefano_zampini             nvv++;
1693b68353e5Sstefano_zampini           }
1694b68353e5Sstefano_zampini           ci[ir] += rsize;
1695b68353e5Sstefano_zampini           nii++;
1696b68353e5Sstefano_zampini         }
1697b68353e5Sstefano_zampini       }
1698b68353e5Sstefano_zampini     }
1699b68353e5Sstefano_zampini   }
1700b68353e5Sstefano_zampini   ierr = PetscFree(ci);CHKERRQ(ierr);
1701b68353e5Sstefano_zampini 
1702b68353e5Sstefano_zampini   /* restore info */
1703b68353e5Sstefano_zampini   for (i=0; i<nest->nr; ++i) {
1704b68353e5Sstefano_zampini     for (j=0; j<nest->nc; ++j) {
1705b68353e5Sstefano_zampini       Mat B = nest->m[i][j];
1706b68353e5Sstefano_zampini       if (B) {
1707b68353e5Sstefano_zampini         PetscInt nnr = 0, k = i*nest->nc+j;
170823875855Sstefano_zampini 
170923875855Sstefano_zampini         B    = (trans[k] ? trans[k] : B);
1710b68353e5Sstefano_zampini         ierr = MatRestoreRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&aii[k],(const PetscInt**)&ajj[k],&done);CHKERRQ(ierr);
1711b68353e5Sstefano_zampini         if (!done) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatRestoreRowIJ");
1712b68353e5Sstefano_zampini         ierr = MatSeqAIJRestoreArray(B,&avv[k]);CHKERRQ(ierr);
171323875855Sstefano_zampini         ierr = MatDestroy(&trans[k]);CHKERRQ(ierr);
1714b68353e5Sstefano_zampini       }
1715b68353e5Sstefano_zampini     }
1716b68353e5Sstefano_zampini   }
171723875855Sstefano_zampini   ierr = PetscFree4(aii,ajj,avv,trans);CHKERRQ(ierr);
1718b68353e5Sstefano_zampini 
1719b68353e5Sstefano_zampini   /* finalize newmat */
1720b68353e5Sstefano_zampini   if (reuse == MAT_INITIAL_MATRIX) {
1721b68353e5Sstefano_zampini     ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,newmat);CHKERRQ(ierr);
1722b68353e5Sstefano_zampini   } else if (reuse == MAT_INPLACE_MATRIX) {
1723b68353e5Sstefano_zampini     Mat B;
1724b68353e5Sstefano_zampini 
1725b68353e5Sstefano_zampini     ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,&B);CHKERRQ(ierr);
1726b68353e5Sstefano_zampini     ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr);
1727b68353e5Sstefano_zampini   }
1728b68353e5Sstefano_zampini   ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1729b68353e5Sstefano_zampini   ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1730b68353e5Sstefano_zampini   {
1731b68353e5Sstefano_zampini     Mat_SeqAIJ *a = (Mat_SeqAIJ*)((*newmat)->data);
1732b68353e5Sstefano_zampini     a->free_a     = PETSC_TRUE;
1733b68353e5Sstefano_zampini     a->free_ij    = PETSC_TRUE;
1734b68353e5Sstefano_zampini   }
1735b68353e5Sstefano_zampini   PetscFunctionReturn(0);
1736b68353e5Sstefano_zampini }
1737b68353e5Sstefano_zampini 
1738cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_Nest_AIJ(Mat A,MatType newtype,MatReuse reuse,Mat *newmat)
1739629c3df2SDmitry Karpeev {
1740629c3df2SDmitry Karpeev   PetscErrorCode ierr;
1741629c3df2SDmitry Karpeev   Mat_Nest       *nest = (Mat_Nest*)A->data;
174283b1a929SMark Adams   PetscInt       m,n,M,N,i,j,k,*dnnz,*onnz,rstart;
1743649b366bSFande Kong   PetscInt       cstart,cend;
1744b68353e5Sstefano_zampini   PetscMPIInt    size;
1745629c3df2SDmitry Karpeev   Mat            C;
1746629c3df2SDmitry Karpeev 
1747629c3df2SDmitry Karpeev   PetscFunctionBegin;
1748b68353e5Sstefano_zampini   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&size);CHKERRQ(ierr);
1749b68353e5Sstefano_zampini   if (size == 1) { /* look for a special case with SeqAIJ matrices and strided-1, contiguous, blocks */
1750b68353e5Sstefano_zampini     PetscInt  nf;
1751b68353e5Sstefano_zampini     PetscBool fast;
1752b68353e5Sstefano_zampini 
1753b68353e5Sstefano_zampini     ierr = PetscStrcmp(newtype,MATAIJ,&fast);CHKERRQ(ierr);
1754b68353e5Sstefano_zampini     if (!fast) {
1755b68353e5Sstefano_zampini       ierr = PetscStrcmp(newtype,MATSEQAIJ,&fast);CHKERRQ(ierr);
1756b68353e5Sstefano_zampini     }
1757b68353e5Sstefano_zampini     for (i=0; i<nest->nr && fast; ++i) {
1758b68353e5Sstefano_zampini       for (j=0; j<nest->nc && fast; ++j) {
1759b68353e5Sstefano_zampini         Mat B = nest->m[i][j];
1760b68353e5Sstefano_zampini         if (B) {
1761b68353e5Sstefano_zampini           ierr = PetscObjectTypeCompare((PetscObject)B,MATSEQAIJ,&fast);CHKERRQ(ierr);
176223875855Sstefano_zampini           if (!fast) {
176323875855Sstefano_zampini             PetscBool istrans;
176423875855Sstefano_zampini 
176523875855Sstefano_zampini             ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans);CHKERRQ(ierr);
176623875855Sstefano_zampini             if (istrans) {
176723875855Sstefano_zampini               Mat Bt;
176823875855Sstefano_zampini 
176923875855Sstefano_zampini               ierr = MatTransposeGetMat(B,&Bt);CHKERRQ(ierr);
177023875855Sstefano_zampini               ierr = PetscObjectTypeCompare((PetscObject)Bt,MATSEQAIJ,&fast);CHKERRQ(ierr);
177123875855Sstefano_zampini             }
1772b68353e5Sstefano_zampini           }
1773b68353e5Sstefano_zampini         }
1774b68353e5Sstefano_zampini       }
1775b68353e5Sstefano_zampini     }
1776b68353e5Sstefano_zampini     for (i=0, nf=0; i<nest->nr && fast; ++i) {
1777b68353e5Sstefano_zampini       ierr = PetscObjectTypeCompare((PetscObject)nest->isglobal.row[i],ISSTRIDE,&fast);CHKERRQ(ierr);
1778b68353e5Sstefano_zampini       if (fast) {
1779b68353e5Sstefano_zampini         PetscInt f,s;
1780b68353e5Sstefano_zampini 
1781b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.row[i],&f,&s);CHKERRQ(ierr);
1782b68353e5Sstefano_zampini         if (f != nf || s != 1) { fast = PETSC_FALSE; }
1783b68353e5Sstefano_zampini         else {
1784b68353e5Sstefano_zampini           ierr = ISGetSize(nest->isglobal.row[i],&f);CHKERRQ(ierr);
1785b68353e5Sstefano_zampini           nf  += f;
1786b68353e5Sstefano_zampini         }
1787b68353e5Sstefano_zampini       }
1788b68353e5Sstefano_zampini     }
1789b68353e5Sstefano_zampini     for (i=0, nf=0; i<nest->nc && fast; ++i) {
1790b68353e5Sstefano_zampini       ierr = PetscObjectTypeCompare((PetscObject)nest->isglobal.col[i],ISSTRIDE,&fast);CHKERRQ(ierr);
1791b68353e5Sstefano_zampini       if (fast) {
1792b68353e5Sstefano_zampini         PetscInt f,s;
1793b68353e5Sstefano_zampini 
1794b68353e5Sstefano_zampini         ierr = ISStrideGetInfo(nest->isglobal.col[i],&f,&s);CHKERRQ(ierr);
1795b68353e5Sstefano_zampini         if (f != nf || s != 1) { fast = PETSC_FALSE; }
1796b68353e5Sstefano_zampini         else {
1797b68353e5Sstefano_zampini           ierr = ISGetSize(nest->isglobal.col[i],&f);CHKERRQ(ierr);
1798b68353e5Sstefano_zampini           nf  += f;
1799b68353e5Sstefano_zampini         }
1800b68353e5Sstefano_zampini       }
1801b68353e5Sstefano_zampini     }
1802b68353e5Sstefano_zampini     if (fast) {
1803b68353e5Sstefano_zampini       ierr = MatConvert_Nest_SeqAIJ_fast(A,newtype,reuse,newmat);CHKERRQ(ierr);
1804b68353e5Sstefano_zampini       PetscFunctionReturn(0);
1805b68353e5Sstefano_zampini     }
1806b68353e5Sstefano_zampini   }
1807629c3df2SDmitry Karpeev   ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr);
1808629c3df2SDmitry Karpeev   ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr);
1809649b366bSFande Kong   ierr = MatGetOwnershipRangeColumn(A,&cstart,&cend);CHKERRQ(ierr);
1810629c3df2SDmitry Karpeev   switch (reuse) {
1811629c3df2SDmitry Karpeev   case MAT_INITIAL_MATRIX:
1812ce94432eSBarry Smith     ierr    = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr);
1813629c3df2SDmitry Karpeev     ierr    = MatSetType(C,newtype);CHKERRQ(ierr);
1814629c3df2SDmitry Karpeev     ierr    = MatSetSizes(C,m,n,M,N);CHKERRQ(ierr);
1815629c3df2SDmitry Karpeev     *newmat = C;
1816629c3df2SDmitry Karpeev     break;
1817629c3df2SDmitry Karpeev   case MAT_REUSE_MATRIX:
1818629c3df2SDmitry Karpeev     C = *newmat;
1819629c3df2SDmitry Karpeev     break;
1820ce94432eSBarry Smith   default: SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MatReuse");
1821629c3df2SDmitry Karpeev   }
1822785e854fSJed Brown   ierr = PetscMalloc1(2*m,&dnnz);CHKERRQ(ierr);
1823629c3df2SDmitry Karpeev   onnz = dnnz + m;
1824629c3df2SDmitry Karpeev   for (k=0; k<m; k++) {
1825629c3df2SDmitry Karpeev     dnnz[k] = 0;
1826629c3df2SDmitry Karpeev     onnz[k] = 0;
1827629c3df2SDmitry Karpeev   }
1828629c3df2SDmitry Karpeev   for (j=0; j<nest->nc; ++j) {
1829629c3df2SDmitry Karpeev     IS             bNis;
1830629c3df2SDmitry Karpeev     PetscInt       bN;
1831629c3df2SDmitry Karpeev     const PetscInt *bNindices;
1832629c3df2SDmitry Karpeev     /* Using global column indices and ISAllGather() is not scalable. */
1833629c3df2SDmitry Karpeev     ierr = ISAllGather(nest->isglobal.col[j], &bNis);CHKERRQ(ierr);
1834629c3df2SDmitry Karpeev     ierr = ISGetSize(bNis, &bN);CHKERRQ(ierr);
1835629c3df2SDmitry Karpeev     ierr = ISGetIndices(bNis,&bNindices);CHKERRQ(ierr);
1836629c3df2SDmitry Karpeev     for (i=0; i<nest->nr; ++i) {
1837629c3df2SDmitry Karpeev       PetscSF        bmsf;
1838649b366bSFande Kong       PetscSFNode    *iremote;
1839629c3df2SDmitry Karpeev       Mat            B;
1840649b366bSFande Kong       PetscInt       bm, *sub_dnnz,*sub_onnz, br;
1841629c3df2SDmitry Karpeev       const PetscInt *bmindices;
1842629c3df2SDmitry Karpeev       B = nest->m[i][j];
1843629c3df2SDmitry Karpeev       if (!B) continue;
1844629c3df2SDmitry Karpeev       ierr = ISGetLocalSize(nest->isglobal.row[i],&bm);CHKERRQ(ierr);
1845629c3df2SDmitry Karpeev       ierr = ISGetIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
1846ce94432eSBarry Smith       ierr = PetscSFCreate(PetscObjectComm((PetscObject)A), &bmsf);CHKERRQ(ierr);
1847649b366bSFande Kong       ierr = PetscMalloc1(bm,&iremote);CHKERRQ(ierr);
1848649b366bSFande Kong       ierr = PetscMalloc1(bm,&sub_dnnz);CHKERRQ(ierr);
1849649b366bSFande Kong       ierr = PetscMalloc1(bm,&sub_onnz);CHKERRQ(ierr);
1850649b366bSFande Kong       for (k = 0; k < bm; ++k){
1851649b366bSFande Kong     	sub_dnnz[k] = 0;
1852649b366bSFande Kong     	sub_onnz[k] = 0;
1853649b366bSFande Kong       }
1854629c3df2SDmitry Karpeev       /*
1855629c3df2SDmitry Karpeev        Locate the owners for all of the locally-owned global row indices for this row block.
1856629c3df2SDmitry Karpeev        These determine the roots of PetscSF used to communicate preallocation data to row owners.
1857629c3df2SDmitry Karpeev        The roots correspond to the dnnz and onnz entries; thus, there are two roots per row.
1858629c3df2SDmitry Karpeev        */
185983b1a929SMark Adams       ierr = MatGetOwnershipRange(B,&rstart,NULL);CHKERRQ(ierr);
1860629c3df2SDmitry Karpeev       for (br = 0; br < bm; ++br) {
1861131c27b5Sprj-         PetscInt       row = bmindices[br], brncols, col;
1862629c3df2SDmitry Karpeev         const PetscInt *brcols;
1863a4b3d3acSMatthew G Knepley         PetscInt       rowrel = 0; /* row's relative index on its owner rank */
1864131c27b5Sprj-         PetscMPIInt    rowowner = 0;
1865629c3df2SDmitry Karpeev         ierr      = PetscLayoutFindOwnerIndex(A->rmap,row,&rowowner,&rowrel);CHKERRQ(ierr);
1866649b366bSFande Kong         /* how many roots  */
1867649b366bSFande Kong         iremote[br].rank = rowowner; iremote[br].index = rowrel;           /* edge from bmdnnz to dnnz */
1868649b366bSFande Kong         /* get nonzero pattern */
186983b1a929SMark Adams         ierr = MatGetRow(B,br+rstart,&brncols,&brcols,NULL);CHKERRQ(ierr);
1870629c3df2SDmitry Karpeev         for (k=0; k<brncols; k++) {
1871629c3df2SDmitry Karpeev           col  = bNindices[brcols[k]];
1872649b366bSFande Kong           if (col>=A->cmap->range[rowowner] && col<A->cmap->range[rowowner+1]) {
1873649b366bSFande Kong             sub_dnnz[br]++;
1874649b366bSFande Kong           } else {
1875649b366bSFande Kong             sub_onnz[br]++;
1876649b366bSFande Kong           }
1877629c3df2SDmitry Karpeev         }
187883b1a929SMark Adams         ierr = MatRestoreRow(B,br+rstart,&brncols,&brcols,NULL);CHKERRQ(ierr);
1879629c3df2SDmitry Karpeev       }
1880629c3df2SDmitry Karpeev       ierr = ISRestoreIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
1881629c3df2SDmitry Karpeev       /* bsf will have to take care of disposing of bedges. */
1882649b366bSFande Kong       ierr = PetscSFSetGraph(bmsf,m,bm,NULL,PETSC_OWN_POINTER,iremote,PETSC_OWN_POINTER);CHKERRQ(ierr);
1883649b366bSFande Kong       ierr = PetscSFReduceBegin(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM);CHKERRQ(ierr);
1884649b366bSFande Kong       ierr = PetscSFReduceEnd(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM);CHKERRQ(ierr);
1885649b366bSFande Kong       ierr = PetscSFReduceBegin(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM);CHKERRQ(ierr);
1886649b366bSFande Kong       ierr = PetscSFReduceEnd(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM);CHKERRQ(ierr);
1887649b366bSFande Kong       ierr = PetscFree(sub_dnnz);CHKERRQ(ierr);
1888649b366bSFande Kong       ierr = PetscFree(sub_onnz);CHKERRQ(ierr);
1889629c3df2SDmitry Karpeev       ierr = PetscSFDestroy(&bmsf);CHKERRQ(ierr);
1890629c3df2SDmitry Karpeev     }
189122d28d08SBarry Smith     ierr = ISRestoreIndices(bNis,&bNindices);CHKERRQ(ierr);
1892629c3df2SDmitry Karpeev     ierr = ISDestroy(&bNis);CHKERRQ(ierr);
189365a4a0a3Sstefano_zampini   }
189465a4a0a3Sstefano_zampini   /* Resize preallocation if overestimated */
189565a4a0a3Sstefano_zampini   for (i=0;i<m;i++) {
189665a4a0a3Sstefano_zampini     dnnz[i] = PetscMin(dnnz[i],A->cmap->n);
189765a4a0a3Sstefano_zampini     onnz[i] = PetscMin(onnz[i],A->cmap->N - A->cmap->n);
1898629c3df2SDmitry Karpeev   }
1899629c3df2SDmitry Karpeev   ierr = MatSeqAIJSetPreallocation(C,0,dnnz);CHKERRQ(ierr);
1900629c3df2SDmitry Karpeev   ierr = MatMPIAIJSetPreallocation(C,0,dnnz,0,onnz);CHKERRQ(ierr);
1901629c3df2SDmitry Karpeev   ierr = PetscFree(dnnz);CHKERRQ(ierr);
1902629c3df2SDmitry Karpeev 
1903629c3df2SDmitry Karpeev   /* Fill by row */
1904629c3df2SDmitry Karpeev   for (j=0; j<nest->nc; ++j) {
1905629c3df2SDmitry Karpeev     /* Using global column indices and ISAllGather() is not scalable. */
1906629c3df2SDmitry Karpeev     IS             bNis;
1907629c3df2SDmitry Karpeev     PetscInt       bN;
1908629c3df2SDmitry Karpeev     const PetscInt *bNindices;
1909629c3df2SDmitry Karpeev     ierr = ISAllGather(nest->isglobal.col[j], &bNis);CHKERRQ(ierr);
1910629c3df2SDmitry Karpeev     ierr = ISGetSize(bNis,&bN);CHKERRQ(ierr);
1911629c3df2SDmitry Karpeev     ierr = ISGetIndices(bNis,&bNindices);CHKERRQ(ierr);
1912629c3df2SDmitry Karpeev     for (i=0; i<nest->nr; ++i) {
1913629c3df2SDmitry Karpeev       Mat            B;
1914629c3df2SDmitry Karpeev       PetscInt       bm, br;
1915629c3df2SDmitry Karpeev       const PetscInt *bmindices;
1916629c3df2SDmitry Karpeev       B = nest->m[i][j];
1917629c3df2SDmitry Karpeev       if (!B) continue;
1918629c3df2SDmitry Karpeev       ierr = ISGetLocalSize(nest->isglobal.row[i],&bm);CHKERRQ(ierr);
1919629c3df2SDmitry Karpeev       ierr = ISGetIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
192083b1a929SMark Adams       ierr = MatGetOwnershipRange(B,&rstart,NULL);CHKERRQ(ierr);
1921629c3df2SDmitry Karpeev       for (br = 0; br < bm; ++br) {
1922629c3df2SDmitry Karpeev         PetscInt          row = bmindices[br], brncols,  *cols;
1923629c3df2SDmitry Karpeev         const PetscInt    *brcols;
1924629c3df2SDmitry Karpeev         const PetscScalar *brcoldata;
192583b1a929SMark Adams         ierr = MatGetRow(B,br+rstart,&brncols,&brcols,&brcoldata);CHKERRQ(ierr);
1926785e854fSJed Brown         ierr = PetscMalloc1(brncols,&cols);CHKERRQ(ierr);
192726fbe8dcSKarl Rupp         for (k=0; k<brncols; k++) cols[k] = bNindices[brcols[k]];
1928629c3df2SDmitry Karpeev         /*
1929629c3df2SDmitry Karpeev           Nest blocks are required to be nonoverlapping -- otherwise nest and monolithic index layouts wouldn't match.
1930629c3df2SDmitry Karpeev           Thus, we could use INSERT_VALUES, but I prefer ADD_VALUES.
1931629c3df2SDmitry Karpeev          */
1932a2ea699eSBarry Smith         ierr = MatSetValues(C,1,&row,brncols,cols,brcoldata,ADD_VALUES);CHKERRQ(ierr);
193383b1a929SMark Adams         ierr = MatRestoreRow(B,br+rstart,&brncols,&brcols,&brcoldata);CHKERRQ(ierr);
1934629c3df2SDmitry Karpeev         ierr = PetscFree(cols);CHKERRQ(ierr);
1935629c3df2SDmitry Karpeev       }
1936629c3df2SDmitry Karpeev       ierr = ISRestoreIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr);
1937629c3df2SDmitry Karpeev     }
1938a2ea699eSBarry Smith     ierr = ISRestoreIndices(bNis,&bNindices);CHKERRQ(ierr);
1939629c3df2SDmitry Karpeev     ierr = ISDestroy(&bNis);CHKERRQ(ierr);
1940629c3df2SDmitry Karpeev   }
1941629c3df2SDmitry Karpeev   ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1942629c3df2SDmitry Karpeev   ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1943629c3df2SDmitry Karpeev   PetscFunctionReturn(0);
1944629c3df2SDmitry Karpeev }
1945629c3df2SDmitry Karpeev 
19468b7d3b4bSBarry Smith PetscErrorCode MatHasOperation_Nest(Mat mat,MatOperation op,PetscBool *has)
19478b7d3b4bSBarry Smith {
19488b7d3b4bSBarry Smith   Mat_Nest       *bA = (Mat_Nest*)mat->data;
19498b7d3b4bSBarry Smith   PetscInt       i,j,nr = bA->nr,nc = bA->nc;
19508b7d3b4bSBarry Smith   PetscBool      flg;
195152c5f739Sprj-   PetscErrorCode ierr;
195252c5f739Sprj-   PetscFunctionBegin;
19538b7d3b4bSBarry Smith 
195452c5f739Sprj-   *has = PETSC_FALSE;
195552c5f739Sprj-   if (op == MATOP_MULT_TRANSPOSE || op == MATOP_MAT_MULT) {
19568b7d3b4bSBarry Smith     for (j=0; j<nc; j++) {
19578b7d3b4bSBarry Smith       for (i=0; i<nr; i++) {
19588b7d3b4bSBarry Smith         if (!bA->m[i][j]) continue;
195952c5f739Sprj-         ierr = MatHasOperation(bA->m[i][j],op,&flg);CHKERRQ(ierr);
19608b7d3b4bSBarry Smith         if (!flg) PetscFunctionReturn(0);
19618b7d3b4bSBarry Smith       }
19628b7d3b4bSBarry Smith     }
19638b7d3b4bSBarry Smith   }
196452c5f739Sprj-   if (((void**)mat->ops)[op] || (op == MATOP_MAT_MULT && flg)) *has = PETSC_TRUE;
19658b7d3b4bSBarry Smith   PetscFunctionReturn(0);
19668b7d3b4bSBarry Smith }
19678b7d3b4bSBarry Smith 
1968659c6bb0SJed Brown /*MC
1969659c6bb0SJed Brown   MATNEST - MATNEST = "nest" - Matrix type consisting of nested submatrices, each stored separately.
1970659c6bb0SJed Brown 
1971659c6bb0SJed Brown   Level: intermediate
1972659c6bb0SJed Brown 
1973659c6bb0SJed Brown   Notes:
1974659c6bb0SJed Brown   This matrix type permits scalable use of PCFieldSplit and avoids the large memory costs of extracting submatrices.
1975659c6bb0SJed Brown   It allows the use of symmetric and block formats for parts of multi-physics simulations.
1976950540a4SJed Brown   It is usually used with DMComposite and DMCreateMatrix()
1977659c6bb0SJed Brown 
  Each of the submatrices lives on the same MPI communicator as the original nest matrix (though they can have zero
  rows/columns on some processes). Thus this is not meant for cases where the submatrices live on far fewer processes
  than the nest matrix.
19818b7d3b4bSBarry Smith 
1982*79798668SBarry Smith .seealso: MatCreate(), MatType, MatCreateNest(), MatNestSetSubMat(), MatNestGetSubMat(),
1983*79798668SBarry Smith           VecCreateNest(), DMCreateMatrix(), DMCOMPOSITE, MatNestSetVecType(), MatNestGetLocalISs(),
1984*79798668SBarry Smith           MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats()
1985659c6bb0SJed Brown M*/
19868cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_Nest(Mat A)
1987c8883902SJed Brown {
1988c8883902SJed Brown   Mat_Nest       *s;
1989c8883902SJed Brown   PetscErrorCode ierr;
1990c8883902SJed Brown 
1991c8883902SJed Brown   PetscFunctionBegin;
1992b00a9115SJed Brown   ierr    = PetscNewLog(A,&s);CHKERRQ(ierr);
1993c8883902SJed Brown   A->data = (void*)s;
1994e7c19651SJed Brown 
1995e7c19651SJed Brown   s->nr            = -1;
1996e7c19651SJed Brown   s->nc            = -1;
19970298fd71SBarry Smith   s->m             = NULL;
1998e7c19651SJed Brown   s->splitassembly = PETSC_FALSE;
1999c8883902SJed Brown 
2000c8883902SJed Brown   ierr = PetscMemzero(A->ops,sizeof(*A->ops));CHKERRQ(ierr);
200126fbe8dcSKarl Rupp 
2002c8883902SJed Brown   A->ops->mult                  = MatMult_Nest;
20039194d70fSJed Brown   A->ops->multadd               = MatMultAdd_Nest;
2004c8883902SJed Brown   A->ops->multtranspose         = MatMultTranspose_Nest;
20059194d70fSJed Brown   A->ops->multtransposeadd      = MatMultTransposeAdd_Nest;
2006f8170845SAlex Fikl   A->ops->transpose             = MatTranspose_Nest;
2007c8883902SJed Brown   A->ops->assemblybegin         = MatAssemblyBegin_Nest;
2008c8883902SJed Brown   A->ops->assemblyend           = MatAssemblyEnd_Nest;
2009c8883902SJed Brown   A->ops->zeroentries           = MatZeroEntries_Nest;
2010c222c20dSDavid Ham   A->ops->copy                  = MatCopy_Nest;
20116e76ffeaSPierre Jolivet   A->ops->axpy                  = MatAXPY_Nest;
2012c8883902SJed Brown   A->ops->duplicate             = MatDuplicate_Nest;
20137dae84e0SHong Zhang   A->ops->createsubmatrix       = MatCreateSubMatrix_Nest;
2014c8883902SJed Brown   A->ops->destroy               = MatDestroy_Nest;
2015c8883902SJed Brown   A->ops->view                  = MatView_Nest;
2016c8883902SJed Brown   A->ops->getvecs               = 0; /* Use VECNEST by calling MatNestSetVecType(A,VECNEST) */
2017c8883902SJed Brown   A->ops->getlocalsubmatrix     = MatGetLocalSubMatrix_Nest;
2018c8883902SJed Brown   A->ops->restorelocalsubmatrix = MatRestoreLocalSubMatrix_Nest;
2019429bac76SJed Brown   A->ops->getdiagonal           = MatGetDiagonal_Nest;
2020429bac76SJed Brown   A->ops->diagonalscale         = MatDiagonalScale_Nest;
2021a061e289SJed Brown   A->ops->scale                 = MatScale_Nest;
2022a061e289SJed Brown   A->ops->shift                 = MatShift_Nest;
202313135bc6SAlex Fikl   A->ops->diagonalset           = MatDiagonalSet_Nest;
2024f8170845SAlex Fikl   A->ops->setrandom             = MatSetRandom_Nest;
20258b7d3b4bSBarry Smith   A->ops->hasoperation          = MatHasOperation_Nest;
2026c8883902SJed Brown 
2027c8883902SJed Brown   A->spptr        = 0;
2028c8883902SJed Brown   A->assembled    = PETSC_FALSE;
2029c8883902SJed Brown 
2030c8883902SJed Brown   /* expose Nest api's */
2031bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",        MatNestGetSubMat_Nest);CHKERRQ(ierr);
2032bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",        MatNestSetSubMat_Nest);CHKERRQ(ierr);
2033bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",       MatNestGetSubMats_Nest);CHKERRQ(ierr);
2034bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",          MatNestGetSize_Nest);CHKERRQ(ierr);
2035bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",           MatNestGetISs_Nest);CHKERRQ(ierr);
2036bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",      MatNestGetLocalISs_Nest);CHKERRQ(ierr);
2037bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",       MatNestSetVecType_Nest);CHKERRQ(ierr);
2038bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",       MatNestSetSubMats_Nest);CHKERRQ(ierr);
20390899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",  MatConvert_Nest_AIJ);CHKERRQ(ierr);
20400899c546SStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",  MatConvert_Nest_AIJ);CHKERRQ(ierr);
204183b1a929SMark Adams   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",     MatConvert_Nest_AIJ);CHKERRQ(ierr);
20425e3038f0Sstefano_zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",      MatConvert_Nest_IS);CHKERRQ(ierr);
204352c5f739Sprj-   ierr = PetscObjectComposeFunction((PetscObject)A,"MatMatMult_nest_mpidense_C",MatMatMult_Nest_Dense);CHKERRQ(ierr);
204452c5f739Sprj-   ierr = PetscObjectComposeFunction((PetscObject)A,"MatMatMult_nest_seqdense_C",MatMatMult_Nest_Dense);CHKERRQ(ierr);
204552c5f739Sprj-   ierr = PetscObjectComposeFunction((PetscObject)A,"MatMatMult_nest_dense_C",   MatMatMult_Nest_Dense);CHKERRQ(ierr);
2046c8883902SJed Brown 
2047c8883902SJed Brown   ierr = PetscObjectChangeTypeName((PetscObject)A,MATNEST);CHKERRQ(ierr);
2048c8883902SJed Brown   PetscFunctionReturn(0);
2049c8883902SJed Brown }
2050