1aaa7dc30SBarry Smith #include <../src/mat/impls/nest/matnestimpl.h> /*I "petscmat.h" I*/ 2b68353e5Sstefano_zampini #include <../src/mat/impls/aij/seq/aij.h> 30c312b8eSJed Brown #include <petscsf.h> 4d8588912SDave May 5c8883902SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat,PetscInt,const IS[],PetscInt,const IS[]); 606a1af2fSStefano Zampini static PetscErrorCode MatCreateVecs_Nest(Mat,Vec*,Vec*); 706a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat); 806a1af2fSStefano Zampini 95e3038f0Sstefano_zampini PETSC_INTERN PetscErrorCode MatConvert_Nest_IS(Mat,MatType,MatReuse,Mat*); 10c8883902SJed Brown 11d8588912SDave May /* private functions */ 128188e55aSJed Brown static PetscErrorCode MatNestGetSizes_Private(Mat A,PetscInt *m,PetscInt *n,PetscInt *M,PetscInt *N) 13d8588912SDave May { 14d8588912SDave May Mat_Nest *bA = (Mat_Nest*)A->data; 158188e55aSJed Brown PetscInt i,j; 16d8588912SDave May PetscErrorCode ierr; 17d8588912SDave May 18d8588912SDave May PetscFunctionBegin; 198188e55aSJed Brown *m = *n = *M = *N = 0; 208188e55aSJed Brown for (i=0; i<bA->nr; i++) { /* rows */ 218188e55aSJed Brown PetscInt sm,sM; 228188e55aSJed Brown ierr = ISGetLocalSize(bA->isglobal.row[i],&sm);CHKERRQ(ierr); 238188e55aSJed Brown ierr = ISGetSize(bA->isglobal.row[i],&sM);CHKERRQ(ierr); 248188e55aSJed Brown *m += sm; 258188e55aSJed Brown *M += sM; 26d8588912SDave May } 278188e55aSJed Brown for (j=0; j<bA->nc; j++) { /* cols */ 288188e55aSJed Brown PetscInt sn,sN; 298188e55aSJed Brown ierr = ISGetLocalSize(bA->isglobal.col[j],&sn);CHKERRQ(ierr); 308188e55aSJed Brown ierr = ISGetSize(bA->isglobal.col[j],&sN);CHKERRQ(ierr); 318188e55aSJed Brown *n += sn; 328188e55aSJed Brown *N += sN; 33d8588912SDave May } 34d8588912SDave May PetscFunctionReturn(0); 35d8588912SDave May } 36d8588912SDave May 37d8588912SDave May /* operations */ 38207556f9SJed Brown static PetscErrorCode MatMult_Nest(Mat A,Vec x,Vec y) 39d8588912SDave May { 40d8588912SDave May Mat_Nest *bA = (Mat_Nest*)A->data; 41207556f9SJed Brown Vec *bx = bA->right,*by = bA->left; 42207556f9SJed Brown PetscInt i,j,nr = bA->nr,nc = bA->nc; 43d8588912SDave May PetscErrorCode ierr; 44d8588912SDave May 45d8588912SDave May PetscFunctionBegin; 46207556f9SJed Brown for (i=0; i<nr; i++) {ierr = VecGetSubVector(y,bA->isglobal.row[i],&by[i]);CHKERRQ(ierr);} 47207556f9SJed Brown for (i=0; i<nc; i++) {ierr = VecGetSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);} 48207556f9SJed Brown for (i=0; i<nr; i++) { 49d8588912SDave May ierr = VecZeroEntries(by[i]);CHKERRQ(ierr); 50207556f9SJed Brown for (j=0; j<nc; j++) { 51207556f9SJed Brown if (!bA->m[i][j]) continue; 52d8588912SDave May /* y[i] <- y[i] + A[i][j] * x[j] */ 53d8588912SDave May ierr = MatMultAdd(bA->m[i][j],bx[j],by[i],by[i]);CHKERRQ(ierr); 54d8588912SDave May } 55d8588912SDave May } 56207556f9SJed Brown for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(y,bA->isglobal.row[i],&by[i]);CHKERRQ(ierr);} 57207556f9SJed Brown for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);} 58d8588912SDave May PetscFunctionReturn(0); 59d8588912SDave May } 60d8588912SDave May 619194d70fSJed Brown static PetscErrorCode MatMultAdd_Nest(Mat A,Vec x,Vec y,Vec z) 629194d70fSJed Brown { 639194d70fSJed Brown Mat_Nest *bA = (Mat_Nest*)A->data; 649194d70fSJed Brown Vec *bx = bA->right,*bz = bA->left; 659194d70fSJed Brown PetscInt i,j,nr = bA->nr,nc = bA->nc; 669194d70fSJed Brown PetscErrorCode ierr; 679194d70fSJed Brown 689194d70fSJed Brown PetscFunctionBegin; 699194d70fSJed Brown for (i=0; i<nr; i++) {ierr = VecGetSubVector(z,bA->isglobal.row[i],&bz[i]);CHKERRQ(ierr);} 709194d70fSJed Brown for (i=0; i<nc; i++) {ierr = VecGetSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);} 719194d70fSJed Brown for (i=0; i<nr; i++) { 729194d70fSJed Brown if (y != z) { 739194d70fSJed Brown Vec by; 749194d70fSJed Brown ierr = VecGetSubVector(y,bA->isglobal.row[i],&by);CHKERRQ(ierr); 759194d70fSJed Brown ierr = VecCopy(by,bz[i]);CHKERRQ(ierr); 76336d21e7SJed Brown ierr = VecRestoreSubVector(y,bA->isglobal.row[i],&by);CHKERRQ(ierr); 779194d70fSJed Brown } 789194d70fSJed Brown for (j=0; j<nc; j++) { 799194d70fSJed Brown if (!bA->m[i][j]) continue; 809194d70fSJed Brown /* y[i] <- y[i] + A[i][j] * x[j] */ 819194d70fSJed Brown ierr = MatMultAdd(bA->m[i][j],bx[j],bz[i],bz[i]);CHKERRQ(ierr); 829194d70fSJed Brown } 839194d70fSJed Brown } 849194d70fSJed Brown for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(z,bA->isglobal.row[i],&bz[i]);CHKERRQ(ierr);} 859194d70fSJed Brown for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.col[i],&bx[i]);CHKERRQ(ierr);} 869194d70fSJed Brown PetscFunctionReturn(0); 879194d70fSJed Brown } 889194d70fSJed Brown 8952c5f739Sprj- typedef struct { 9052c5f739Sprj- Mat *workC; /* array of Mat with specific containers depending on the underlying MatMatMult implementation */ 9152c5f739Sprj- PetscScalar *tarray; /* buffer for storing all temporary products A[i][j] B[j] */ 9252c5f739Sprj- PetscInt *dm,*dn,k; /* displacements and number of submatrices */ 9352c5f739Sprj- } Nest_Dense; 9452c5f739Sprj- 956718818eSStefano Zampini PETSC_INTERN PetscErrorCode MatProductNumeric_Nest_Dense(Mat C) 9652c5f739Sprj- { 976718818eSStefano Zampini Mat_Nest *bA; 9852c5f739Sprj- Nest_Dense *contents; 996718818eSStefano Zampini Mat viewB,viewC,productB,workC; 10052c5f739Sprj- const PetscScalar *barray; 10152c5f739Sprj- PetscScalar *carray; 1026718818eSStefano Zampini PetscInt i,j,M,N,nr,nc,ldb,ldc; 10352c5f739Sprj- PetscErrorCode ierr; 1046718818eSStefano Zampini Mat A,B; 10552c5f739Sprj- 10652c5f739Sprj- PetscFunctionBegin; 1076718818eSStefano Zampini MatCheckProduct(C,3); 1086718818eSStefano Zampini A = C->product->A; 1096718818eSStefano Zampini B = C->product->B; 1106718818eSStefano Zampini ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr); 1116718818eSStefano Zampini if (!N) { 1126718818eSStefano Zampini ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1136718818eSStefano Zampini ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1146718818eSStefano Zampini PetscFunctionReturn(0); 1156718818eSStefano Zampini } 1166718818eSStefano Zampini contents = (Nest_Dense*)C->product->data; 117*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(!contents,PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Product data empty"); 1186718818eSStefano Zampini bA = (Mat_Nest*)A->data; 1196718818eSStefano Zampini nr = bA->nr; 1206718818eSStefano Zampini nc = bA->nc; 12152c5f739Sprj- ierr = MatDenseGetLDA(B,&ldb);CHKERRQ(ierr); 12252c5f739Sprj- ierr = MatDenseGetLDA(C,&ldc);CHKERRQ(ierr); 12352c5f739Sprj- ierr = MatZeroEntries(C);CHKERRQ(ierr); 12452c5f739Sprj- ierr = MatDenseGetArrayRead(B,&barray);CHKERRQ(ierr); 1253d8925e7SStefano Zampini ierr = MatDenseGetArray(C,&carray);CHKERRQ(ierr); 12652c5f739Sprj- for (i=0; i<nr; i++) { 12752c5f739Sprj- ierr = ISGetSize(bA->isglobal.row[i],&M);CHKERRQ(ierr); 12852c5f739Sprj- ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dm[i+1]-contents->dm[i],PETSC_DECIDE,M,N,carray+contents->dm[i],&viewC);CHKERRQ(ierr); 1296718818eSStefano Zampini ierr = MatDenseSetLDA(viewC,ldc);CHKERRQ(ierr); 13052c5f739Sprj- for (j=0; j<nc; j++) { 13152c5f739Sprj- if (!bA->m[i][j]) continue; 13252c5f739Sprj- ierr = ISGetSize(bA->isglobal.col[j],&M);CHKERRQ(ierr); 13352c5f739Sprj- ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB);CHKERRQ(ierr); 1346718818eSStefano Zampini ierr = MatDenseSetLDA(viewB,ldb);CHKERRQ(ierr); 1354222ddf1SHong Zhang 1364222ddf1SHong Zhang /* MatMatMultNumeric(bA->m[i][j],viewB,contents->workC[i*nc + j]); */ 1374222ddf1SHong Zhang workC = contents->workC[i*nc + j]; 1384222ddf1SHong Zhang productB = workC->product->B; 1394222ddf1SHong Zhang workC->product->B = viewB; /* use newly created dense matrix viewB */ 1406718818eSStefano Zampini ierr = MatProductNumeric(workC);CHKERRQ(ierr); 14152c5f739Sprj- ierr = MatDestroy(&viewB);CHKERRQ(ierr); 1424222ddf1SHong Zhang workC->product->B = productB; /* resume original B */ 1434222ddf1SHong Zhang 14452c5f739Sprj- /* C[i] <- workC + C[i] */ 14552c5f739Sprj- ierr = MatAXPY(viewC,1.0,contents->workC[i*nc + j],SAME_NONZERO_PATTERN);CHKERRQ(ierr); 14652c5f739Sprj- } 14752c5f739Sprj- ierr = MatDestroy(&viewC);CHKERRQ(ierr); 14852c5f739Sprj- } 1493d8925e7SStefano Zampini ierr = MatDenseRestoreArray(C,&carray);CHKERRQ(ierr); 15052c5f739Sprj- ierr = MatDenseRestoreArrayRead(B,&barray);CHKERRQ(ierr); 1514222ddf1SHong Zhang 1524222ddf1SHong Zhang ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1534222ddf1SHong Zhang ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15452c5f739Sprj- PetscFunctionReturn(0); 15552c5f739Sprj- } 15652c5f739Sprj- 15752c5f739Sprj- PetscErrorCode MatNest_DenseDestroy(void *ctx) 15852c5f739Sprj- { 15952c5f739Sprj- Nest_Dense *contents = (Nest_Dense*)ctx; 16052c5f739Sprj- PetscInt i; 16152c5f739Sprj- PetscErrorCode ierr; 16252c5f739Sprj- 16352c5f739Sprj- PetscFunctionBegin; 16452c5f739Sprj- ierr = PetscFree(contents->tarray);CHKERRQ(ierr); 16552c5f739Sprj- for (i=0; i<contents->k; i++) { 16652c5f739Sprj- ierr = MatDestroy(contents->workC + i);CHKERRQ(ierr); 16752c5f739Sprj- } 16852c5f739Sprj- ierr = PetscFree3(contents->dm,contents->dn,contents->workC);CHKERRQ(ierr); 16952c5f739Sprj- ierr = PetscFree(contents);CHKERRQ(ierr); 17052c5f739Sprj- PetscFunctionReturn(0); 17152c5f739Sprj- } 17252c5f739Sprj- 1736718818eSStefano Zampini PETSC_INTERN PetscErrorCode MatProductSymbolic_Nest_Dense(Mat C) 17452c5f739Sprj- { 1756718818eSStefano Zampini Mat_Nest *bA; 1766718818eSStefano Zampini Mat viewB,workC; 17752c5f739Sprj- const PetscScalar *barray; 1786718818eSStefano Zampini PetscInt i,j,M,N,m,n,nr,nc,maxm = 0,ldb; 1794222ddf1SHong Zhang Nest_Dense *contents=NULL; 1806718818eSStefano Zampini PetscBool cisdense; 18152c5f739Sprj- PetscErrorCode ierr; 1826718818eSStefano Zampini Mat A,B; 1836718818eSStefano Zampini PetscReal fill; 18452c5f739Sprj- 18552c5f739Sprj- PetscFunctionBegin; 1866718818eSStefano Zampini MatCheckProduct(C,4); 187*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(C->product->data,PetscObjectComm((PetscObject)C),PETSC_ERR_PLIB,"Product data not empty"); 1886718818eSStefano Zampini A = C->product->A; 1896718818eSStefano Zampini B = C->product->B; 1906718818eSStefano Zampini fill = C->product->fill; 1916718818eSStefano Zampini bA = (Mat_Nest*)A->data; 1926718818eSStefano Zampini nr = bA->nr; 1936718818eSStefano Zampini nc = bA->nc; 1940572eedcSPierre Jolivet ierr = MatGetLocalSize(C,&m,&n);CHKERRQ(ierr); 1950572eedcSPierre Jolivet ierr = MatGetSize(C,&M,&N);CHKERRQ(ierr); 1960572eedcSPierre Jolivet if (m == PETSC_DECIDE || n == PETSC_DECIDE || M == PETSC_DECIDE || N == PETSC_DECIDE) { 1976718818eSStefano Zampini ierr = MatGetLocalSize(B,NULL,&n);CHKERRQ(ierr); 19852c5f739Sprj- ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr); 19952c5f739Sprj- ierr = MatGetLocalSize(A,&m,NULL);CHKERRQ(ierr); 20052c5f739Sprj- ierr = MatGetSize(A,&M,NULL);CHKERRQ(ierr); 2016718818eSStefano Zampini ierr = MatSetSizes(C,m,n,M,N);CHKERRQ(ierr); 2020572eedcSPierre Jolivet } 2036718818eSStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATMPIDENSE,MATSEQDENSECUDA,MATMPIDENSECUDA,"");CHKERRQ(ierr); 2046718818eSStefano Zampini if (!cisdense) { 2056718818eSStefano Zampini ierr = MatSetType(C,((PetscObject)B)->type_name);CHKERRQ(ierr); 2066718818eSStefano Zampini } 20718992e5dSStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 2086718818eSStefano Zampini if (!N) { 2096718818eSStefano Zampini C->ops->productnumeric = MatProductNumeric_Nest_Dense; 2106718818eSStefano Zampini PetscFunctionReturn(0); 21152c5f739Sprj- } 21252c5f739Sprj- 21352c5f739Sprj- ierr = PetscNew(&contents);CHKERRQ(ierr); 2146718818eSStefano Zampini C->product->data = contents; 2156718818eSStefano Zampini C->product->destroy = MatNest_DenseDestroy; 21652c5f739Sprj- ierr = PetscCalloc3(nr+1,&contents->dm,nc+1,&contents->dn,nr*nc,&contents->workC);CHKERRQ(ierr); 21752c5f739Sprj- contents->k = nr*nc; 21852c5f739Sprj- for (i=0; i<nr; i++) { 21952c5f739Sprj- ierr = ISGetLocalSize(bA->isglobal.row[i],contents->dm + i+1);CHKERRQ(ierr); 22052c5f739Sprj- maxm = PetscMax(maxm,contents->dm[i+1]); 22152c5f739Sprj- contents->dm[i+1] += contents->dm[i]; 22252c5f739Sprj- } 22352c5f739Sprj- for (i=0; i<nc; i++) { 22452c5f739Sprj- ierr = ISGetLocalSize(bA->isglobal.col[i],contents->dn + i+1);CHKERRQ(ierr); 22552c5f739Sprj- contents->dn[i+1] += contents->dn[i]; 22652c5f739Sprj- } 22752c5f739Sprj- ierr = PetscMalloc1(maxm*N,&contents->tarray);CHKERRQ(ierr); 22852c5f739Sprj- ierr = MatDenseGetLDA(B,&ldb);CHKERRQ(ierr); 22952c5f739Sprj- ierr = MatGetSize(B,NULL,&N);CHKERRQ(ierr); 23052c5f739Sprj- ierr = MatDenseGetArrayRead(B,&barray);CHKERRQ(ierr); 23152c5f739Sprj- /* loops are permuted compared to MatMatMultNumeric so that viewB is created only once per column of A */ 23252c5f739Sprj- for (j=0; j<nc; j++) { 23352c5f739Sprj- ierr = ISGetSize(bA->isglobal.col[j],&M);CHKERRQ(ierr); 23452c5f739Sprj- ierr = MatCreateDense(PetscObjectComm((PetscObject)A),contents->dn[j+1]-contents->dn[j],PETSC_DECIDE,M,N,(PetscScalar*)(barray+contents->dn[j]),&viewB);CHKERRQ(ierr); 2356718818eSStefano Zampini ierr = MatDenseSetLDA(viewB,ldb);CHKERRQ(ierr); 23652c5f739Sprj- for (i=0; i<nr; i++) { 23752c5f739Sprj- if (!bA->m[i][j]) continue; 23852c5f739Sprj- /* MatMatMultSymbolic may attach a specific container (depending on MatType of bA->m[i][j]) to workC[i][j] */ 2394222ddf1SHong Zhang 2404222ddf1SHong Zhang ierr = MatProductCreate(bA->m[i][j],viewB,NULL,&contents->workC[i*nc + j]);CHKERRQ(ierr); 2414222ddf1SHong Zhang workC = contents->workC[i*nc + j]; 2424222ddf1SHong Zhang ierr = MatProductSetType(workC,MATPRODUCT_AB);CHKERRQ(ierr); 2434222ddf1SHong Zhang ierr = MatProductSetAlgorithm(workC,"default");CHKERRQ(ierr); 2444222ddf1SHong Zhang ierr = MatProductSetFill(workC,fill);CHKERRQ(ierr); 2454222ddf1SHong Zhang ierr = MatProductSetFromOptions(workC);CHKERRQ(ierr); 2464222ddf1SHong Zhang ierr = MatProductSymbolic(workC);CHKERRQ(ierr); 2474222ddf1SHong Zhang 2486718818eSStefano Zampini /* since tarray will be shared by all Mat */ 2496718818eSStefano Zampini ierr = MatSeqDenseSetPreallocation(workC,contents->tarray);CHKERRQ(ierr); 2506718818eSStefano Zampini ierr = MatMPIDenseSetPreallocation(workC,contents->tarray);CHKERRQ(ierr); 25152c5f739Sprj- } 25252c5f739Sprj- ierr = MatDestroy(&viewB);CHKERRQ(ierr); 25352c5f739Sprj- } 25452c5f739Sprj- ierr = MatDenseRestoreArrayRead(B,&barray);CHKERRQ(ierr); 25552c5f739Sprj- 2566718818eSStefano Zampini C->ops->productnumeric = MatProductNumeric_Nest_Dense; 25752c5f739Sprj- PetscFunctionReturn(0); 25852c5f739Sprj- } 25952c5f739Sprj- 2604222ddf1SHong Zhang /* --------------------------------------------------------- */ 2614222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_Nest_Dense_AB(Mat C) 2624222ddf1SHong Zhang { 2634222ddf1SHong Zhang PetscFunctionBegin; 2646718818eSStefano Zampini C->ops->productsymbolic = MatProductSymbolic_Nest_Dense; 2654222ddf1SHong Zhang PetscFunctionReturn(0); 2664222ddf1SHong Zhang } 2674222ddf1SHong Zhang 2684222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_Nest_Dense(Mat C) 26952c5f739Sprj- { 27052c5f739Sprj- PetscErrorCode ierr; 2714222ddf1SHong Zhang Mat_Product *product = C->product; 27252c5f739Sprj- 27352c5f739Sprj- PetscFunctionBegin; 2744222ddf1SHong Zhang if (product->type == MATPRODUCT_AB) { 2754222ddf1SHong Zhang ierr = MatProductSetFromOptions_Nest_Dense_AB(C);CHKERRQ(ierr); 2766718818eSStefano Zampini } 27752c5f739Sprj- PetscFunctionReturn(0); 27852c5f739Sprj- } 2794222ddf1SHong Zhang /* --------------------------------------------------------- */ 28052c5f739Sprj- 281207556f9SJed Brown static PetscErrorCode MatMultTranspose_Nest(Mat A,Vec x,Vec y) 282d8588912SDave May { 283d8588912SDave May Mat_Nest *bA = (Mat_Nest*)A->data; 284207556f9SJed Brown Vec *bx = bA->left,*by = bA->right; 285207556f9SJed Brown PetscInt i,j,nr = bA->nr,nc = bA->nc; 286d8588912SDave May PetscErrorCode ierr; 287d8588912SDave May 288d8588912SDave May PetscFunctionBegin; 289609e31cbSJed Brown for (i=0; i<nr; i++) {ierr = VecGetSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);} 290609e31cbSJed Brown for (i=0; i<nc; i++) {ierr = VecGetSubVector(y,bA->isglobal.col[i],&by[i]);CHKERRQ(ierr);} 291207556f9SJed Brown for (j=0; j<nc; j++) { 292609e31cbSJed Brown ierr = VecZeroEntries(by[j]);CHKERRQ(ierr); 293609e31cbSJed Brown for (i=0; i<nr; i++) { 2946c75ac25SJed Brown if (!bA->m[i][j]) continue; 295609e31cbSJed Brown /* y[j] <- y[j] + (A[i][j])^T * x[i] */ 296609e31cbSJed Brown ierr = MatMultTransposeAdd(bA->m[i][j],bx[i],by[j],by[j]);CHKERRQ(ierr); 297d8588912SDave May } 298d8588912SDave May } 299609e31cbSJed Brown for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);} 300609e31cbSJed Brown for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(y,bA->isglobal.col[i],&by[i]);CHKERRQ(ierr);} 301d8588912SDave May PetscFunctionReturn(0); 302d8588912SDave May } 303d8588912SDave May 3049194d70fSJed Brown static PetscErrorCode MatMultTransposeAdd_Nest(Mat A,Vec x,Vec y,Vec z) 3059194d70fSJed Brown { 3069194d70fSJed Brown Mat_Nest *bA = (Mat_Nest*)A->data; 3079194d70fSJed Brown Vec *bx = bA->left,*bz = bA->right; 3089194d70fSJed Brown PetscInt i,j,nr = bA->nr,nc = bA->nc; 3099194d70fSJed Brown PetscErrorCode ierr; 3109194d70fSJed Brown 3119194d70fSJed Brown PetscFunctionBegin; 3129194d70fSJed Brown for (i=0; i<nr; i++) {ierr = VecGetSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);} 3139194d70fSJed Brown for (i=0; i<nc; i++) {ierr = VecGetSubVector(z,bA->isglobal.col[i],&bz[i]);CHKERRQ(ierr);} 3149194d70fSJed Brown for (j=0; j<nc; j++) { 3159194d70fSJed Brown if (y != z) { 3169194d70fSJed Brown Vec by; 3179194d70fSJed Brown ierr = VecGetSubVector(y,bA->isglobal.col[j],&by);CHKERRQ(ierr); 3189194d70fSJed Brown ierr = VecCopy(by,bz[j]);CHKERRQ(ierr); 3199194d70fSJed Brown ierr = VecRestoreSubVector(y,bA->isglobal.col[j],&by);CHKERRQ(ierr); 3209194d70fSJed Brown } 3219194d70fSJed Brown for (i=0; i<nr; i++) { 3226c75ac25SJed Brown if (!bA->m[i][j]) continue; 3239194d70fSJed Brown /* z[j] <- y[j] + (A[i][j])^T * x[i] */ 3249194d70fSJed Brown ierr = MatMultTransposeAdd(bA->m[i][j],bx[i],bz[j],bz[j]);CHKERRQ(ierr); 3259194d70fSJed Brown } 3269194d70fSJed Brown } 3279194d70fSJed Brown for (i=0; i<nr; i++) {ierr = VecRestoreSubVector(x,bA->isglobal.row[i],&bx[i]);CHKERRQ(ierr);} 3289194d70fSJed Brown for (i=0; i<nc; i++) {ierr = VecRestoreSubVector(z,bA->isglobal.col[i],&bz[i]);CHKERRQ(ierr);} 3299194d70fSJed Brown PetscFunctionReturn(0); 3309194d70fSJed Brown } 3319194d70fSJed Brown 332f8170845SAlex Fikl static PetscErrorCode MatTranspose_Nest(Mat A,MatReuse reuse,Mat *B) 333f8170845SAlex Fikl { 334f8170845SAlex Fikl Mat_Nest *bA = (Mat_Nest*)A->data, *bC; 335f8170845SAlex Fikl Mat C; 336f8170845SAlex Fikl PetscInt i,j,nr = bA->nr,nc = bA->nc; 337f8170845SAlex Fikl PetscErrorCode ierr; 338f8170845SAlex Fikl 339f8170845SAlex Fikl PetscFunctionBegin; 340*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(reuse == MAT_INPLACE_MATRIX && nr != nc,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_SIZ,"Square nested matrix only for in-place"); 341f8170845SAlex Fikl 342cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_INPLACE_MATRIX) { 343f8170845SAlex Fikl Mat *subs; 344f8170845SAlex Fikl IS *is_row,*is_col; 345f8170845SAlex Fikl 346f8170845SAlex Fikl ierr = PetscCalloc1(nr * nc,&subs);CHKERRQ(ierr); 347f8170845SAlex Fikl ierr = PetscMalloc2(nr,&is_row,nc,&is_col);CHKERRQ(ierr); 348f8170845SAlex Fikl ierr = MatNestGetISs(A,is_row,is_col);CHKERRQ(ierr); 349cf37664fSBarry Smith if (reuse == MAT_INPLACE_MATRIX) { 350ddeb9bd8SAlex Fikl for (i=0; i<nr; i++) { 351ddeb9bd8SAlex Fikl for (j=0; j<nc; j++) { 352ddeb9bd8SAlex Fikl subs[i + nr * j] = bA->m[i][j]; 353ddeb9bd8SAlex Fikl } 354ddeb9bd8SAlex Fikl } 355ddeb9bd8SAlex Fikl } 356ddeb9bd8SAlex Fikl 357f8170845SAlex Fikl ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nc,is_col,nr,is_row,subs,&C);CHKERRQ(ierr); 358f8170845SAlex Fikl ierr = PetscFree(subs);CHKERRQ(ierr); 3593d994f23SBarry Smith ierr = PetscFree2(is_row,is_col);CHKERRQ(ierr); 360f8170845SAlex Fikl } else { 361f8170845SAlex Fikl C = *B; 362f8170845SAlex Fikl } 363f8170845SAlex Fikl 364f8170845SAlex Fikl bC = (Mat_Nest*)C->data; 365f8170845SAlex Fikl for (i=0; i<nr; i++) { 366f8170845SAlex Fikl for (j=0; j<nc; j++) { 367f8170845SAlex Fikl if (bA->m[i][j]) { 368f8170845SAlex Fikl ierr = MatTranspose(bA->m[i][j], reuse, &(bC->m[j][i]));CHKERRQ(ierr); 369f8170845SAlex Fikl } else { 370f8170845SAlex Fikl bC->m[j][i] = NULL; 371f8170845SAlex Fikl } 372f8170845SAlex Fikl } 373f8170845SAlex Fikl } 374f8170845SAlex Fikl 375cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) { 376f8170845SAlex Fikl *B = C; 377f8170845SAlex Fikl } else { 378f8170845SAlex Fikl ierr = MatHeaderMerge(A, &C);CHKERRQ(ierr); 379f8170845SAlex Fikl } 380f8170845SAlex Fikl PetscFunctionReturn(0); 381f8170845SAlex Fikl } 382f8170845SAlex Fikl 383e2d7f03fSJed Brown static PetscErrorCode MatNestDestroyISList(PetscInt n,IS **list) 384e2d7f03fSJed Brown { 385e2d7f03fSJed Brown PetscErrorCode ierr; 386e2d7f03fSJed Brown IS *lst = *list; 387e2d7f03fSJed Brown PetscInt i; 388e2d7f03fSJed Brown 389e2d7f03fSJed Brown PetscFunctionBegin; 390e2d7f03fSJed Brown if (!lst) PetscFunctionReturn(0); 3916bf464f9SBarry Smith for (i=0; i<n; i++) if (lst[i]) {ierr = ISDestroy(&lst[i]);CHKERRQ(ierr);} 392e2d7f03fSJed Brown ierr = PetscFree(lst);CHKERRQ(ierr); 3930298fd71SBarry Smith *list = NULL; 394e2d7f03fSJed Brown PetscFunctionReturn(0); 395e2d7f03fSJed Brown } 396e2d7f03fSJed Brown 39706a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat A) 398d8588912SDave May { 399d8588912SDave May Mat_Nest *vs = (Mat_Nest*)A->data; 400d8588912SDave May PetscInt i,j; 401d8588912SDave May PetscErrorCode ierr; 402d8588912SDave May 403d8588912SDave May PetscFunctionBegin; 404d8588912SDave May /* release the matrices and the place holders */ 405e2d7f03fSJed Brown ierr = MatNestDestroyISList(vs->nr,&vs->isglobal.row);CHKERRQ(ierr); 406e2d7f03fSJed Brown ierr = MatNestDestroyISList(vs->nc,&vs->isglobal.col);CHKERRQ(ierr); 407e2d7f03fSJed Brown ierr = MatNestDestroyISList(vs->nr,&vs->islocal.row);CHKERRQ(ierr); 408e2d7f03fSJed Brown ierr = MatNestDestroyISList(vs->nc,&vs->islocal.col);CHKERRQ(ierr); 409d8588912SDave May 410d8588912SDave May ierr = PetscFree(vs->row_len);CHKERRQ(ierr); 411d8588912SDave May ierr = PetscFree(vs->col_len);CHKERRQ(ierr); 41206a1af2fSStefano Zampini ierr = PetscFree(vs->nnzstate);CHKERRQ(ierr); 413d8588912SDave May 414207556f9SJed Brown ierr = PetscFree2(vs->left,vs->right);CHKERRQ(ierr); 415207556f9SJed Brown 416d8588912SDave May /* release the matrices and the place holders */ 417d8588912SDave May if (vs->m) { 418d8588912SDave May for (i=0; i<vs->nr; i++) { 419d8588912SDave May for (j=0; j<vs->nc; j++) { 4206bf464f9SBarry Smith ierr = MatDestroy(&vs->m[i][j]);CHKERRQ(ierr); 421d8588912SDave May } 422d8588912SDave May ierr = PetscFree(vs->m[i]);CHKERRQ(ierr); 423d8588912SDave May } 424d8588912SDave May ierr = PetscFree(vs->m);CHKERRQ(ierr); 425d8588912SDave May } 42606a1af2fSStefano Zampini 42706a1af2fSStefano Zampini /* restore defaults */ 42806a1af2fSStefano Zampini vs->nr = 0; 42906a1af2fSStefano Zampini vs->nc = 0; 43006a1af2fSStefano Zampini vs->splitassembly = PETSC_FALSE; 43106a1af2fSStefano Zampini PetscFunctionReturn(0); 43206a1af2fSStefano Zampini } 43306a1af2fSStefano Zampini 43406a1af2fSStefano Zampini static PetscErrorCode MatDestroy_Nest(Mat A) 43506a1af2fSStefano Zampini { 43606a1af2fSStefano Zampini PetscErrorCode ierr; 43706a1af2fSStefano Zampini 438362febeeSStefano Zampini PetscFunctionBegin; 43906a1af2fSStefano Zampini ierr = MatReset_Nest(A);CHKERRQ(ierr); 440bf0cc555SLisandro Dalcin ierr = PetscFree(A->data);CHKERRQ(ierr); 441be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C",NULL);CHKERRQ(ierr); 442be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C",NULL);CHKERRQ(ierr); 443be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C",NULL);CHKERRQ(ierr); 444be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C",NULL);CHKERRQ(ierr); 445be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C",NULL);CHKERRQ(ierr); 446be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C",NULL);CHKERRQ(ierr); 447be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C",NULL);CHKERRQ(ierr); 448be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C",NULL);CHKERRQ(ierr); 449be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C",NULL);CHKERRQ(ierr); 450be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C",NULL);CHKERRQ(ierr); 451be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C",NULL);CHKERRQ(ierr); 452be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C",NULL);CHKERRQ(ierr); 453be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpidense_C",NULL);CHKERRQ(ierr); 454be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqdense_C",NULL);CHKERRQ(ierr); 4554222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_seqdense_C",NULL);CHKERRQ(ierr); 4564222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_mpidense_C",NULL);CHKERRQ(ierr); 4574222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_dense_C",NULL);CHKERRQ(ierr); 458d8588912SDave May PetscFunctionReturn(0); 459d8588912SDave May } 460d8588912SDave May 461381b8e50SStefano Zampini static PetscErrorCode MatMissingDiagonal_Nest(Mat mat,PetscBool *missing,PetscInt *dd) 462381b8e50SStefano Zampini { 463381b8e50SStefano Zampini Mat_Nest *vs = (Mat_Nest*)mat->data; 464381b8e50SStefano Zampini PetscInt i; 465381b8e50SStefano Zampini PetscErrorCode ierr; 466381b8e50SStefano Zampini 467381b8e50SStefano Zampini PetscFunctionBegin; 468381b8e50SStefano Zampini if (dd) *dd = 0; 469381b8e50SStefano Zampini if (!vs->nr) { 470381b8e50SStefano Zampini *missing = PETSC_TRUE; 471381b8e50SStefano Zampini PetscFunctionReturn(0); 472381b8e50SStefano Zampini } 473381b8e50SStefano Zampini *missing = PETSC_FALSE; 474381b8e50SStefano Zampini for (i = 0; i < vs->nr && !(*missing); i++) { 475381b8e50SStefano Zampini *missing = PETSC_TRUE; 476381b8e50SStefano Zampini if (vs->m[i][i]) { 477381b8e50SStefano Zampini ierr = MatMissingDiagonal(vs->m[i][i],missing,NULL);CHKERRQ(ierr); 478*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(*missing && dd,PetscObjectComm((PetscObject)mat),PETSC_ERR_SUP,"First missing entry not yet implemented"); 479381b8e50SStefano Zampini } 480381b8e50SStefano Zampini } 481381b8e50SStefano Zampini PetscFunctionReturn(0); 482381b8e50SStefano Zampini } 483381b8e50SStefano Zampini 484207556f9SJed Brown static PetscErrorCode MatAssemblyBegin_Nest(Mat A,MatAssemblyType type) 485d8588912SDave May { 486d8588912SDave May Mat_Nest *vs = (Mat_Nest*)A->data; 487d8588912SDave May PetscInt i,j; 488d8588912SDave May PetscErrorCode ierr; 48906a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 490d8588912SDave May 491d8588912SDave May PetscFunctionBegin; 492d8588912SDave May for (i=0; i<vs->nr; i++) { 493d8588912SDave May for (j=0; j<vs->nc; j++) { 49406a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 495e7c19651SJed Brown if (vs->m[i][j]) { 496e7c19651SJed Brown ierr = MatAssemblyBegin(vs->m[i][j],type);CHKERRQ(ierr); 497e7c19651SJed Brown if (!vs->splitassembly) { 498e7c19651SJed Brown /* Note: split assembly will fail if the same block appears more than once (even indirectly through a nested 499e7c19651SJed Brown * sub-block). This could be fixed by adding a flag to Mat so that there was a way to check if a Mat was 500e7c19651SJed Brown * already performing an assembly, but the result would by more complicated and appears to offer less 501e7c19651SJed Brown * potential for diagnostics and correctness checking. Split assembly should be fixed once there is an 502e7c19651SJed Brown * interface for libraries to make asynchronous progress in "user-defined non-blocking collectives". 503e7c19651SJed Brown */ 504e7c19651SJed Brown ierr = MatAssemblyEnd(vs->m[i][j],type);CHKERRQ(ierr); 50506a1af2fSStefano Zampini ierr = MatGetNonzeroState(vs->m[i][j],&subnnzstate);CHKERRQ(ierr); 506e7c19651SJed Brown } 507e7c19651SJed Brown } 50806a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || vs->nnzstate[i*vs->nc+j] != subnnzstate); 50906a1af2fSStefano Zampini vs->nnzstate[i*vs->nc+j] = subnnzstate; 510d8588912SDave May } 511d8588912SDave May } 51206a1af2fSStefano Zampini if (nnzstate) A->nonzerostate++; 513d8588912SDave May PetscFunctionReturn(0); 514d8588912SDave May } 515d8588912SDave May 516207556f9SJed Brown static PetscErrorCode MatAssemblyEnd_Nest(Mat A, MatAssemblyType type) 517d8588912SDave May { 518d8588912SDave May Mat_Nest *vs = (Mat_Nest*)A->data; 519d8588912SDave May PetscInt i,j; 520d8588912SDave May PetscErrorCode ierr; 521d8588912SDave May 522d8588912SDave May PetscFunctionBegin; 523d8588912SDave May for (i=0; i<vs->nr; i++) { 524d8588912SDave May for (j=0; j<vs->nc; j++) { 525e7c19651SJed Brown if (vs->m[i][j]) { 526e7c19651SJed Brown if (vs->splitassembly) { 527e7c19651SJed Brown ierr = MatAssemblyEnd(vs->m[i][j],type);CHKERRQ(ierr); 528e7c19651SJed Brown } 529e7c19651SJed Brown } 530d8588912SDave May } 531d8588912SDave May } 532d8588912SDave May PetscFunctionReturn(0); 533d8588912SDave May } 534d8588912SDave May 535f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatRow(Mat A,PetscInt row,Mat *B) 536d8588912SDave May { 537207556f9SJed Brown PetscErrorCode ierr; 538f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest*)A->data; 539f349c1fdSJed Brown PetscInt j; 540f349c1fdSJed Brown Mat sub; 541d8588912SDave May 542d8588912SDave May PetscFunctionBegin; 5430298fd71SBarry Smith sub = (row < vs->nc) ? vs->m[row][row] : (Mat)NULL; /* Prefer to find on the diagonal */ 544f349c1fdSJed Brown for (j=0; !sub && j<vs->nc; j++) sub = vs->m[row][j]; 5454994cf47SJed Brown if (sub) {ierr = MatSetUp(sub);CHKERRQ(ierr);} /* Ensure that the sizes are available */ 546f349c1fdSJed Brown *B = sub; 547f349c1fdSJed Brown PetscFunctionReturn(0); 548d8588912SDave May } 549d8588912SDave May 550f349c1fdSJed Brown static PetscErrorCode MatNestFindNonzeroSubMatCol(Mat A,PetscInt col,Mat *B) 551f349c1fdSJed Brown { 552207556f9SJed Brown PetscErrorCode ierr; 553f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest*)A->data; 554f349c1fdSJed Brown PetscInt i; 555f349c1fdSJed Brown Mat sub; 556f349c1fdSJed Brown 557f349c1fdSJed Brown PetscFunctionBegin; 5580298fd71SBarry Smith sub = (col < vs->nr) ? vs->m[col][col] : (Mat)NULL; /* Prefer to find on the diagonal */ 559f349c1fdSJed Brown for (i=0; !sub && i<vs->nr; i++) sub = vs->m[i][col]; 5604994cf47SJed Brown if (sub) {ierr = MatSetUp(sub);CHKERRQ(ierr);} /* Ensure that the sizes are available */ 561f349c1fdSJed Brown *B = sub; 562f349c1fdSJed Brown PetscFunctionReturn(0); 563d8588912SDave May } 564d8588912SDave May 56518d228c0SPierre Jolivet static PetscErrorCode MatNestFindISRange(Mat A,PetscInt n,const IS list[],IS is,PetscInt *begin,PetscInt *end) 566f349c1fdSJed Brown { 56718d228c0SPierre Jolivet PetscInt i,j,size,m; 568f349c1fdSJed Brown PetscBool flg; 56918d228c0SPierre Jolivet IS out,concatenate[2]; 57018d228c0SPierre Jolivet PetscErrorCode ierr; 571f349c1fdSJed Brown 572f349c1fdSJed Brown PetscFunctionBegin; 573f349c1fdSJed Brown PetscValidPointer(list,3); 574f349c1fdSJed Brown PetscValidHeaderSpecific(is,IS_CLASSID,4); 57518d228c0SPierre Jolivet if (begin) { 57618d228c0SPierre Jolivet PetscValidIntPointer(begin,5); 57718d228c0SPierre Jolivet *begin = -1; 57818d228c0SPierre Jolivet } 57918d228c0SPierre Jolivet if (end) { 58018d228c0SPierre Jolivet PetscValidIntPointer(end,6); 58118d228c0SPierre Jolivet *end = -1; 58218d228c0SPierre Jolivet } 583f349c1fdSJed Brown for (i=0; i<n; i++) { 584207556f9SJed Brown if (!list[i]) continue; 585320466b0SStefano Zampini ierr = ISEqualUnsorted(list[i],is,&flg);CHKERRQ(ierr); 586f349c1fdSJed Brown if (flg) { 58718d228c0SPierre Jolivet if (begin) *begin = i; 58818d228c0SPierre Jolivet if (end) *end = i+1; 589f349c1fdSJed Brown PetscFunctionReturn(0); 590f349c1fdSJed Brown } 591f349c1fdSJed Brown } 59218d228c0SPierre Jolivet ierr = ISGetSize(is,&size);CHKERRQ(ierr); 59318d228c0SPierre Jolivet for (i=0; i<n-1; i++) { 59418d228c0SPierre Jolivet if (!list[i]) continue; 59518d228c0SPierre Jolivet m = 0; 59618d228c0SPierre Jolivet ierr = ISConcatenate(PetscObjectComm((PetscObject)A),2,list+i,&out);CHKERRQ(ierr); 59718d228c0SPierre Jolivet ierr = ISGetSize(out,&m);CHKERRQ(ierr); 59818d228c0SPierre Jolivet for (j=i+2; j<n && m<size; j++) { 59918d228c0SPierre Jolivet if (list[j]) { 60018d228c0SPierre Jolivet concatenate[0] = out; 60118d228c0SPierre Jolivet concatenate[1] = list[j]; 60218d228c0SPierre Jolivet ierr = ISConcatenate(PetscObjectComm((PetscObject)A),2,concatenate,&out);CHKERRQ(ierr); 60318d228c0SPierre Jolivet ierr = ISDestroy(concatenate);CHKERRQ(ierr); 60418d228c0SPierre Jolivet ierr = ISGetSize(out,&m);CHKERRQ(ierr); 60518d228c0SPierre Jolivet } 60618d228c0SPierre Jolivet } 60718d228c0SPierre Jolivet if (m == size) { 60818d228c0SPierre Jolivet ierr = ISEqualUnsorted(out,is,&flg);CHKERRQ(ierr); 60918d228c0SPierre Jolivet if (flg) { 61018d228c0SPierre Jolivet if (begin) *begin = i; 61118d228c0SPierre Jolivet if (end) *end = j; 61218d228c0SPierre Jolivet ierr = ISDestroy(&out);CHKERRQ(ierr); 61318d228c0SPierre Jolivet PetscFunctionReturn(0); 61418d228c0SPierre Jolivet } 61518d228c0SPierre Jolivet } 61618d228c0SPierre Jolivet ierr = ISDestroy(&out);CHKERRQ(ierr); 61718d228c0SPierre Jolivet } 61818d228c0SPierre Jolivet PetscFunctionReturn(0); 619f349c1fdSJed Brown } 620f349c1fdSJed Brown 62118d228c0SPierre Jolivet static PetscErrorCode MatNestFillEmptyMat_Private(Mat A,PetscInt i,PetscInt j,Mat *B) 6228188e55aSJed Brown { 6238188e55aSJed Brown Mat_Nest *vs = (Mat_Nest*)A->data; 62418d228c0SPierre Jolivet PetscInt lr,lc; 62518d228c0SPierre Jolivet PetscErrorCode ierr; 62618d228c0SPierre Jolivet 62718d228c0SPierre Jolivet PetscFunctionBegin; 62818d228c0SPierre Jolivet ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr); 62918d228c0SPierre Jolivet ierr = ISGetLocalSize(vs->isglobal.row[i],&lr);CHKERRQ(ierr); 63018d228c0SPierre Jolivet ierr = ISGetLocalSize(vs->isglobal.col[j],&lc);CHKERRQ(ierr); 63118d228c0SPierre Jolivet ierr = MatSetSizes(*B,lr,lc,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr); 63218d228c0SPierre Jolivet ierr = MatSetType(*B,MATAIJ);CHKERRQ(ierr); 63318d228c0SPierre Jolivet ierr = MatSeqAIJSetPreallocation(*B,0,NULL);CHKERRQ(ierr); 63418d228c0SPierre Jolivet ierr = MatMPIAIJSetPreallocation(*B,0,NULL,0,NULL);CHKERRQ(ierr); 63518d228c0SPierre Jolivet ierr = MatSetUp(*B);CHKERRQ(ierr); 63618d228c0SPierre Jolivet ierr = MatSetOption(*B,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 63718d228c0SPierre Jolivet ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 63818d228c0SPierre Jolivet ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 63918d228c0SPierre Jolivet PetscFunctionReturn(0); 64018d228c0SPierre Jolivet } 64118d228c0SPierre Jolivet 64218d228c0SPierre Jolivet static PetscErrorCode MatNestGetBlock_Private(Mat A,PetscInt rbegin,PetscInt rend,PetscInt cbegin,PetscInt cend,Mat *B) 64318d228c0SPierre Jolivet { 64418d228c0SPierre Jolivet Mat_Nest *vs = (Mat_Nest*)A->data; 64518d228c0SPierre Jolivet Mat *a; 64618d228c0SPierre Jolivet PetscInt i,j,k,l,nr=rend-rbegin,nc=cend-cbegin; 6478188e55aSJed Brown char keyname[256]; 64818d228c0SPierre Jolivet PetscBool *b; 64918d228c0SPierre Jolivet PetscBool flg; 6508188e55aSJed Brown PetscErrorCode ierr; 6518188e55aSJed Brown 6528188e55aSJed Brown PetscFunctionBegin; 6530298fd71SBarry Smith *B = NULL; 654c0aa6a63SJacob Faibussowitsch ierr = PetscSNPrintf(keyname,sizeof(keyname),"NestBlock_%" PetscInt_FMT "-%" PetscInt_FMT "x%" PetscInt_FMT "-%" PetscInt_FMT,rbegin,rend,cbegin,cend);CHKERRQ(ierr); 6558188e55aSJed Brown ierr = PetscObjectQuery((PetscObject)A,keyname,(PetscObject*)B);CHKERRQ(ierr); 6568188e55aSJed Brown if (*B) PetscFunctionReturn(0); 6578188e55aSJed Brown 65818d228c0SPierre Jolivet ierr = PetscMalloc2(nr*nc,&a,nr*nc,&b);CHKERRQ(ierr); 65918d228c0SPierre Jolivet for (i=0; i<nr; i++) { 66018d228c0SPierre Jolivet for (j=0; j<nc; j++) { 66118d228c0SPierre Jolivet a[i*nc + j] = vs->m[rbegin+i][cbegin+j]; 66218d228c0SPierre Jolivet b[i*nc + j] = PETSC_FALSE; 66318d228c0SPierre Jolivet } 66418d228c0SPierre Jolivet } 66518d228c0SPierre Jolivet if (nc!=vs->nc&&nr!=vs->nr) { 66618d228c0SPierre Jolivet for (i=0; i<nr; i++) { 66718d228c0SPierre Jolivet for (j=0; j<nc; j++) { 66818d228c0SPierre Jolivet flg = PETSC_FALSE; 66918d228c0SPierre Jolivet for (k=0; (k<nr&&!flg); k++) { 67018d228c0SPierre Jolivet if (a[j + k*nc]) flg = PETSC_TRUE; 67118d228c0SPierre Jolivet } 67218d228c0SPierre Jolivet if (flg) { 67318d228c0SPierre Jolivet flg = PETSC_FALSE; 67418d228c0SPierre Jolivet for (l=0; (l<nc&&!flg); l++) { 67518d228c0SPierre Jolivet if (a[i*nc + l]) flg = PETSC_TRUE; 67618d228c0SPierre Jolivet } 67718d228c0SPierre Jolivet } 67818d228c0SPierre Jolivet if (!flg) { 67918d228c0SPierre Jolivet b[i*nc + j] = PETSC_TRUE; 68018d228c0SPierre Jolivet ierr = MatNestFillEmptyMat_Private(A,rbegin+i,cbegin+j,a + i*nc + j);CHKERRQ(ierr); 68118d228c0SPierre Jolivet } 68218d228c0SPierre Jolivet } 68318d228c0SPierre Jolivet } 68418d228c0SPierre Jolivet } 68518d228c0SPierre Jolivet ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nr,nr!=vs->nr?NULL:vs->isglobal.row,nc,nc!=vs->nc?NULL:vs->isglobal.col,a,B);CHKERRQ(ierr); 68618d228c0SPierre Jolivet for (i=0; i<nr; i++) { 68718d228c0SPierre Jolivet for (j=0; j<nc; j++) { 68818d228c0SPierre Jolivet if (b[i*nc + j]) { 68918d228c0SPierre Jolivet ierr = MatDestroy(a + i*nc + j);CHKERRQ(ierr); 69018d228c0SPierre Jolivet } 69118d228c0SPierre Jolivet } 69218d228c0SPierre Jolivet } 69318d228c0SPierre Jolivet ierr = PetscFree2(a,b);CHKERRQ(ierr); 6948188e55aSJed Brown (*B)->assembled = A->assembled; 6958188e55aSJed Brown ierr = PetscObjectCompose((PetscObject)A,keyname,(PetscObject)*B);CHKERRQ(ierr); 6968188e55aSJed Brown ierr = PetscObjectDereference((PetscObject)*B);CHKERRQ(ierr); /* Leave the only remaining reference in the composition */ 6978188e55aSJed Brown PetscFunctionReturn(0); 6988188e55aSJed Brown } 6998188e55aSJed Brown 700f349c1fdSJed Brown static PetscErrorCode MatNestFindSubMat(Mat A,struct MatNestISPair *is,IS isrow,IS iscol,Mat *B) 701f349c1fdSJed Brown { 702f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest*)A->data; 70318d228c0SPierre Jolivet PetscInt rbegin,rend,cbegin,cend; 7048188e55aSJed Brown PetscErrorCode ierr; 705f349c1fdSJed Brown 706f349c1fdSJed Brown PetscFunctionBegin; 70718d228c0SPierre Jolivet ierr = MatNestFindISRange(A,vs->nr,is->row,isrow,&rbegin,&rend);CHKERRQ(ierr); 70818d228c0SPierre Jolivet ierr = MatNestFindISRange(A,vs->nc,is->col,iscol,&cbegin,&cend);CHKERRQ(ierr); 70918d228c0SPierre Jolivet if (rend == rbegin + 1 && cend == cbegin + 1) { 71018d228c0SPierre Jolivet if (!vs->m[rbegin][cbegin]) { 71118d228c0SPierre Jolivet ierr = MatNestFillEmptyMat_Private(A,rbegin,cbegin,vs->m[rbegin] + cbegin);CHKERRQ(ierr); 71277019fcaSJed Brown } 71318d228c0SPierre Jolivet *B = vs->m[rbegin][cbegin]; 71418d228c0SPierre Jolivet } else if (rbegin != -1 && cbegin != -1) { 71518d228c0SPierre Jolivet ierr = MatNestGetBlock_Private(A,rbegin,rend,cbegin,cend,B);CHKERRQ(ierr); 71618d228c0SPierre Jolivet } else SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Could not find index set"); 717f349c1fdSJed Brown PetscFunctionReturn(0); 718f349c1fdSJed Brown } 719f349c1fdSJed Brown 72006a1af2fSStefano Zampini /* 72106a1af2fSStefano Zampini TODO: This does not actually returns a submatrix we can modify 72206a1af2fSStefano Zampini */ 7237dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrix_Nest(Mat A,IS isrow,IS iscol,MatReuse reuse,Mat *B) 724f349c1fdSJed Brown { 725f349c1fdSJed Brown PetscErrorCode ierr; 726f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest*)A->data; 727f349c1fdSJed Brown Mat sub; 728f349c1fdSJed Brown 729f349c1fdSJed Brown PetscFunctionBegin; 730f349c1fdSJed Brown ierr = MatNestFindSubMat(A,&vs->isglobal,isrow,iscol,&sub);CHKERRQ(ierr); 731f349c1fdSJed Brown switch (reuse) { 732f349c1fdSJed Brown case MAT_INITIAL_MATRIX: 7337874fa86SDave May if (sub) { ierr = PetscObjectReference((PetscObject)sub);CHKERRQ(ierr); } 734f349c1fdSJed Brown *B = sub; 735f349c1fdSJed Brown break; 736f349c1fdSJed Brown case MAT_REUSE_MATRIX: 737*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(sub != *B,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Submatrix was not used before in this call"); 738f349c1fdSJed Brown break; 739f349c1fdSJed Brown case MAT_IGNORE_MATRIX: /* Nothing to do */ 740f349c1fdSJed Brown break; 741511c6705SHong Zhang case MAT_INPLACE_MATRIX: /* Nothing to do */ 742511c6705SHong Zhang SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"MAT_INPLACE_MATRIX is not supported yet"); 743f349c1fdSJed Brown } 744f349c1fdSJed Brown PetscFunctionReturn(0); 745f349c1fdSJed Brown } 746f349c1fdSJed Brown 747f349c1fdSJed Brown PetscErrorCode MatGetLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B) 748f349c1fdSJed Brown { 749f349c1fdSJed Brown PetscErrorCode ierr; 750f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest*)A->data; 751f349c1fdSJed Brown Mat sub; 752f349c1fdSJed Brown 753f349c1fdSJed Brown PetscFunctionBegin; 754f349c1fdSJed Brown ierr = MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub);CHKERRQ(ierr); 755f349c1fdSJed Brown /* We allow the submatrix to be NULL, perhaps it would be better for the user to return an empty matrix instead */ 756f349c1fdSJed Brown if (sub) {ierr = PetscObjectReference((PetscObject)sub);CHKERRQ(ierr);} 757f349c1fdSJed Brown *B = sub; 758d8588912SDave May PetscFunctionReturn(0); 759d8588912SDave May } 760d8588912SDave May 761207556f9SJed Brown static PetscErrorCode MatRestoreLocalSubMatrix_Nest(Mat A,IS isrow,IS iscol,Mat *B) 762d8588912SDave May { 763d8588912SDave May PetscErrorCode ierr; 764f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest*)A->data; 765f349c1fdSJed Brown Mat sub; 766d8588912SDave May 767d8588912SDave May PetscFunctionBegin; 768f349c1fdSJed Brown ierr = MatNestFindSubMat(A,&vs->islocal,isrow,iscol,&sub);CHKERRQ(ierr); 769*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(*B != sub,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has not been gotten"); 770f349c1fdSJed Brown if (sub) { 771*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(((PetscObject)sub)->refct <= 1,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Local submatrix has had reference count decremented too many times"); 7726bf464f9SBarry Smith ierr = MatDestroy(B);CHKERRQ(ierr); 773d8588912SDave May } 774d8588912SDave May PetscFunctionReturn(0); 775d8588912SDave May } 776d8588912SDave May 7777874fa86SDave May static PetscErrorCode MatGetDiagonal_Nest(Mat A,Vec v) 7787874fa86SDave May { 7797874fa86SDave May Mat_Nest *bA = (Mat_Nest*)A->data; 7807874fa86SDave May PetscInt i; 7817874fa86SDave May PetscErrorCode ierr; 7827874fa86SDave May 7837874fa86SDave May PetscFunctionBegin; 7847874fa86SDave May for (i=0; i<bA->nr; i++) { 785429bac76SJed Brown Vec bv; 786429bac76SJed Brown ierr = VecGetSubVector(v,bA->isglobal.row[i],&bv);CHKERRQ(ierr); 7877874fa86SDave May if (bA->m[i][i]) { 788429bac76SJed Brown ierr = MatGetDiagonal(bA->m[i][i],bv);CHKERRQ(ierr); 7897874fa86SDave May } else { 7905159a857SMatthew G. Knepley ierr = VecSet(bv,0.0);CHKERRQ(ierr); 7917874fa86SDave May } 792429bac76SJed Brown ierr = VecRestoreSubVector(v,bA->isglobal.row[i],&bv);CHKERRQ(ierr); 7937874fa86SDave May } 7947874fa86SDave May PetscFunctionReturn(0); 7957874fa86SDave May } 7967874fa86SDave May 7977874fa86SDave May static PetscErrorCode MatDiagonalScale_Nest(Mat A,Vec l,Vec r) 7987874fa86SDave May { 7997874fa86SDave May Mat_Nest *bA = (Mat_Nest*)A->data; 800429bac76SJed Brown Vec bl,*br; 8017874fa86SDave May PetscInt i,j; 8027874fa86SDave May PetscErrorCode ierr; 8037874fa86SDave May 8047874fa86SDave May PetscFunctionBegin; 8053f800ebeSJed Brown ierr = PetscCalloc1(bA->nc,&br);CHKERRQ(ierr); 8062e6472ebSElliott Sales de Andrade if (r) { 807429bac76SJed Brown for (j=0; j<bA->nc; j++) {ierr = VecGetSubVector(r,bA->isglobal.col[j],&br[j]);CHKERRQ(ierr);} 8082e6472ebSElliott Sales de Andrade } 8092e6472ebSElliott Sales de Andrade bl = NULL; 8107874fa86SDave May for (i=0; i<bA->nr; i++) { 8112e6472ebSElliott Sales de Andrade if (l) { 812429bac76SJed Brown ierr = VecGetSubVector(l,bA->isglobal.row[i],&bl);CHKERRQ(ierr); 8132e6472ebSElliott Sales de Andrade } 8147874fa86SDave May for (j=0; j<bA->nc; j++) { 8157874fa86SDave May if (bA->m[i][j]) { 816429bac76SJed Brown ierr = MatDiagonalScale(bA->m[i][j],bl,br[j]);CHKERRQ(ierr); 8177874fa86SDave May } 8187874fa86SDave May } 8192e6472ebSElliott Sales de Andrade if (l) { 820a061e289SJed Brown ierr = VecRestoreSubVector(l,bA->isglobal.row[i],&bl);CHKERRQ(ierr); 8217874fa86SDave May } 8222e6472ebSElliott Sales de Andrade } 8232e6472ebSElliott Sales de Andrade if (r) { 824429bac76SJed Brown for (j=0; j<bA->nc; j++) {ierr = VecRestoreSubVector(r,bA->isglobal.col[j],&br[j]);CHKERRQ(ierr);} 8252e6472ebSElliott Sales de Andrade } 826429bac76SJed Brown ierr = PetscFree(br);CHKERRQ(ierr); 8277874fa86SDave May PetscFunctionReturn(0); 8287874fa86SDave May } 8297874fa86SDave May 830a061e289SJed Brown static PetscErrorCode MatScale_Nest(Mat A,PetscScalar a) 831a061e289SJed Brown { 832a061e289SJed Brown Mat_Nest *bA = (Mat_Nest*)A->data; 833a061e289SJed Brown PetscInt i,j; 834a061e289SJed Brown PetscErrorCode ierr; 835a061e289SJed Brown 836a061e289SJed Brown PetscFunctionBegin; 837a061e289SJed Brown for (i=0; i<bA->nr; i++) { 838a061e289SJed Brown for (j=0; j<bA->nc; j++) { 839a061e289SJed Brown if (bA->m[i][j]) { 840a061e289SJed Brown ierr = MatScale(bA->m[i][j],a);CHKERRQ(ierr); 841a061e289SJed Brown } 842a061e289SJed Brown } 843a061e289SJed Brown } 844a061e289SJed Brown PetscFunctionReturn(0); 845a061e289SJed Brown } 846a061e289SJed Brown 847a061e289SJed Brown static PetscErrorCode MatShift_Nest(Mat A,PetscScalar a) 848a061e289SJed Brown { 849a061e289SJed Brown Mat_Nest *bA = (Mat_Nest*)A->data; 850a061e289SJed Brown PetscInt i; 851a061e289SJed Brown PetscErrorCode ierr; 85206a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 853a061e289SJed Brown 854a061e289SJed Brown PetscFunctionBegin; 855a061e289SJed Brown for (i=0; i<bA->nr; i++) { 85606a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 857*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(!bA->m[i][i],PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"No support for shifting an empty diagonal block, insert a matrix in block (%" PetscInt_FMT ",%" PetscInt_FMT ")",i,i); 858a061e289SJed Brown ierr = MatShift(bA->m[i][i],a);CHKERRQ(ierr); 85906a1af2fSStefano Zampini ierr = MatGetNonzeroState(bA->m[i][i],&subnnzstate);CHKERRQ(ierr); 86006a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i*bA->nc+i] != subnnzstate); 86106a1af2fSStefano Zampini bA->nnzstate[i*bA->nc+i] = subnnzstate; 862a061e289SJed Brown } 86306a1af2fSStefano Zampini if (nnzstate) A->nonzerostate++; 864a061e289SJed Brown PetscFunctionReturn(0); 865a061e289SJed Brown } 866a061e289SJed Brown 86713135bc6SAlex Fikl static PetscErrorCode MatDiagonalSet_Nest(Mat A,Vec D,InsertMode is) 86813135bc6SAlex Fikl { 86913135bc6SAlex Fikl Mat_Nest *bA = (Mat_Nest*)A->data; 87013135bc6SAlex Fikl PetscInt i; 87113135bc6SAlex Fikl PetscErrorCode ierr; 87206a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 87313135bc6SAlex Fikl 87413135bc6SAlex Fikl PetscFunctionBegin; 87513135bc6SAlex Fikl for (i=0; i<bA->nr; i++) { 87606a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 87713135bc6SAlex Fikl Vec bv; 87813135bc6SAlex Fikl ierr = VecGetSubVector(D,bA->isglobal.row[i],&bv);CHKERRQ(ierr); 87913135bc6SAlex Fikl if (bA->m[i][i]) { 88013135bc6SAlex Fikl ierr = MatDiagonalSet(bA->m[i][i],bv,is);CHKERRQ(ierr); 88106a1af2fSStefano Zampini ierr = MatGetNonzeroState(bA->m[i][i],&subnnzstate);CHKERRQ(ierr); 88213135bc6SAlex Fikl } 88313135bc6SAlex Fikl ierr = VecRestoreSubVector(D,bA->isglobal.row[i],&bv);CHKERRQ(ierr); 88406a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i*bA->nc+i] != subnnzstate); 88506a1af2fSStefano Zampini bA->nnzstate[i*bA->nc+i] = subnnzstate; 88613135bc6SAlex Fikl } 88706a1af2fSStefano Zampini if (nnzstate) A->nonzerostate++; 88813135bc6SAlex Fikl PetscFunctionReturn(0); 88913135bc6SAlex Fikl } 89013135bc6SAlex Fikl 891f8170845SAlex Fikl static PetscErrorCode MatSetRandom_Nest(Mat A,PetscRandom rctx) 892f8170845SAlex Fikl { 893f8170845SAlex Fikl Mat_Nest *bA = (Mat_Nest*)A->data; 894f8170845SAlex Fikl PetscInt i,j; 895f8170845SAlex Fikl PetscErrorCode ierr; 896f8170845SAlex Fikl 897f8170845SAlex Fikl PetscFunctionBegin; 898f8170845SAlex Fikl for (i=0; i<bA->nr; i++) { 899f8170845SAlex Fikl for (j=0; j<bA->nc; j++) { 900f8170845SAlex Fikl if (bA->m[i][j]) { 901f8170845SAlex Fikl ierr = MatSetRandom(bA->m[i][j],rctx);CHKERRQ(ierr); 902f8170845SAlex Fikl } 903f8170845SAlex Fikl } 904f8170845SAlex Fikl } 905f8170845SAlex Fikl PetscFunctionReturn(0); 906f8170845SAlex Fikl } 907f8170845SAlex Fikl 9082a7a6963SBarry Smith static PetscErrorCode MatCreateVecs_Nest(Mat A,Vec *right,Vec *left) 909d8588912SDave May { 910d8588912SDave May Mat_Nest *bA = (Mat_Nest*)A->data; 911d8588912SDave May Vec *L,*R; 912d8588912SDave May MPI_Comm comm; 913d8588912SDave May PetscInt i,j; 914d8588912SDave May PetscErrorCode ierr; 915d8588912SDave May 916d8588912SDave May PetscFunctionBegin; 917ce94432eSBarry Smith ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr); 918d8588912SDave May if (right) { 919d8588912SDave May /* allocate R */ 920854ce69bSBarry Smith ierr = PetscMalloc1(bA->nc, &R);CHKERRQ(ierr); 921d8588912SDave May /* Create the right vectors */ 922d8588912SDave May for (j=0; j<bA->nc; j++) { 923d8588912SDave May for (i=0; i<bA->nr; i++) { 924d8588912SDave May if (bA->m[i][j]) { 9252a7a6963SBarry Smith ierr = MatCreateVecs(bA->m[i][j],&R[j],NULL);CHKERRQ(ierr); 926d8588912SDave May break; 927d8588912SDave May } 928d8588912SDave May } 929*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(i==bA->nr,PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null column."); 930d8588912SDave May } 931f349c1fdSJed Brown ierr = VecCreateNest(comm,bA->nc,bA->isglobal.col,R,right);CHKERRQ(ierr); 932d8588912SDave May /* hand back control to the nest vector */ 933d8588912SDave May for (j=0; j<bA->nc; j++) { 9346bf464f9SBarry Smith ierr = VecDestroy(&R[j]);CHKERRQ(ierr); 935d8588912SDave May } 936d8588912SDave May ierr = PetscFree(R);CHKERRQ(ierr); 937d8588912SDave May } 938d8588912SDave May 939d8588912SDave May if (left) { 940d8588912SDave May /* allocate L */ 941854ce69bSBarry Smith ierr = PetscMalloc1(bA->nr, &L);CHKERRQ(ierr); 942d8588912SDave May /* Create the left vectors */ 943d8588912SDave May for (i=0; i<bA->nr; i++) { 944d8588912SDave May for (j=0; j<bA->nc; j++) { 945d8588912SDave May if (bA->m[i][j]) { 9462a7a6963SBarry Smith ierr = MatCreateVecs(bA->m[i][j],NULL,&L[i]);CHKERRQ(ierr); 947d8588912SDave May break; 948d8588912SDave May } 949d8588912SDave May } 950*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(j==bA->nc,PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null row."); 951d8588912SDave May } 952d8588912SDave May 953f349c1fdSJed Brown ierr = VecCreateNest(comm,bA->nr,bA->isglobal.row,L,left);CHKERRQ(ierr); 954d8588912SDave May for (i=0; i<bA->nr; i++) { 9556bf464f9SBarry Smith ierr = VecDestroy(&L[i]);CHKERRQ(ierr); 956d8588912SDave May } 957d8588912SDave May 958d8588912SDave May ierr = PetscFree(L);CHKERRQ(ierr); 959d8588912SDave May } 960d8588912SDave May PetscFunctionReturn(0); 961d8588912SDave May } 962d8588912SDave May 963207556f9SJed Brown static PetscErrorCode MatView_Nest(Mat A,PetscViewer viewer) 964d8588912SDave May { 965d8588912SDave May Mat_Nest *bA = (Mat_Nest*)A->data; 96629e60adbSStefano Zampini PetscBool isascii,viewSub = PETSC_FALSE; 967d8588912SDave May PetscInt i,j; 968d8588912SDave May PetscErrorCode ierr; 969d8588912SDave May 970d8588912SDave May PetscFunctionBegin; 971251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr); 972d8588912SDave May if (isascii) { 973d8588912SDave May 97429e60adbSStefano Zampini ierr = PetscOptionsGetBool(((PetscObject)A)->options,((PetscObject)A)->prefix,"-mat_view_nest_sub",&viewSub,NULL);CHKERRQ(ierr); 975d86155a6SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"Matrix object: \n");CHKERRQ(ierr); 976d86155a6SBarry Smith ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr); 977c0aa6a63SJacob Faibussowitsch ierr = PetscViewerASCIIPrintf(viewer, "type=nest, rows=%" PetscInt_FMT ", cols=%" PetscInt_FMT " \n",bA->nr,bA->nc);CHKERRQ(ierr); 978d8588912SDave May 979d86155a6SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"MatNest structure: \n");CHKERRQ(ierr); 980d8588912SDave May for (i=0; i<bA->nr; i++) { 981d8588912SDave May for (j=0; j<bA->nc; j++) { 98219fd82e9SBarry Smith MatType type; 983270f95d7SJed Brown char name[256] = "",prefix[256] = ""; 984d8588912SDave May PetscInt NR,NC; 985d8588912SDave May PetscBool isNest = PETSC_FALSE; 986d8588912SDave May 987d8588912SDave May if (!bA->m[i][j]) { 988c0aa6a63SJacob Faibussowitsch ierr = PetscViewerASCIIPrintf(viewer, "(%" PetscInt_FMT ",%" PetscInt_FMT ") : NULL \n",i,j);CHKERRQ(ierr); 989d8588912SDave May continue; 990d8588912SDave May } 991d8588912SDave May ierr = MatGetSize(bA->m[i][j],&NR,&NC);CHKERRQ(ierr); 992d8588912SDave May ierr = MatGetType(bA->m[i][j], &type);CHKERRQ(ierr); 9938caf3d72SBarry Smith if (((PetscObject)bA->m[i][j])->name) {ierr = PetscSNPrintf(name,sizeof(name),"name=\"%s\", ",((PetscObject)bA->m[i][j])->name);CHKERRQ(ierr);} 9948caf3d72SBarry Smith if (((PetscObject)bA->m[i][j])->prefix) {ierr = PetscSNPrintf(prefix,sizeof(prefix),"prefix=\"%s\", ",((PetscObject)bA->m[i][j])->prefix);CHKERRQ(ierr);} 995251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)bA->m[i][j],MATNEST,&isNest);CHKERRQ(ierr); 996d8588912SDave May 997c0aa6a63SJacob Faibussowitsch ierr = PetscViewerASCIIPrintf(viewer,"(%" PetscInt_FMT ",%" PetscInt_FMT ") : %s%stype=%s, rows=%" PetscInt_FMT ", cols=%" PetscInt_FMT " \n",i,j,name,prefix,type,NR,NC);CHKERRQ(ierr); 998d8588912SDave May 99929e60adbSStefano Zampini if (isNest || viewSub) { 1000270f95d7SJed Brown ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr); /* push1 */ 1001d8588912SDave May ierr = MatView(bA->m[i][j],viewer);CHKERRQ(ierr); 1002270f95d7SJed Brown ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr); /* pop1 */ 1003d8588912SDave May } 1004d8588912SDave May } 1005d8588912SDave May } 1006d86155a6SBarry Smith ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr); /* pop0 */ 1007d8588912SDave May } 1008d8588912SDave May PetscFunctionReturn(0); 1009d8588912SDave May } 1010d8588912SDave May 1011207556f9SJed Brown static PetscErrorCode MatZeroEntries_Nest(Mat A) 1012d8588912SDave May { 1013d8588912SDave May Mat_Nest *bA = (Mat_Nest*)A->data; 1014d8588912SDave May PetscInt i,j; 1015d8588912SDave May PetscErrorCode ierr; 1016d8588912SDave May 1017d8588912SDave May PetscFunctionBegin; 1018d8588912SDave May for (i=0; i<bA->nr; i++) { 1019d8588912SDave May for (j=0; j<bA->nc; j++) { 1020d8588912SDave May if (!bA->m[i][j]) continue; 1021d8588912SDave May ierr = MatZeroEntries(bA->m[i][j]);CHKERRQ(ierr); 1022d8588912SDave May } 1023d8588912SDave May } 1024d8588912SDave May PetscFunctionReturn(0); 1025d8588912SDave May } 1026d8588912SDave May 1027c222c20dSDavid Ham static PetscErrorCode MatCopy_Nest(Mat A,Mat B,MatStructure str) 1028c222c20dSDavid Ham { 1029c222c20dSDavid Ham Mat_Nest *bA = (Mat_Nest*)A->data,*bB = (Mat_Nest*)B->data; 1030c222c20dSDavid Ham PetscInt i,j,nr = bA->nr,nc = bA->nc; 1031c222c20dSDavid Ham PetscErrorCode ierr; 103206a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 1033c222c20dSDavid Ham 1034c222c20dSDavid Ham PetscFunctionBegin; 1035*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(nr != bB->nr || nc != bB->nc,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Cannot copy a Mat_Nest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ") to a Mat_Nest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ")",bB->nr,bB->nc,nr,nc); 1036c222c20dSDavid Ham for (i=0; i<nr; i++) { 1037c222c20dSDavid Ham for (j=0; j<nc; j++) { 103806a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 103946a2b97cSJed Brown if (bA->m[i][j] && bB->m[i][j]) { 1040c222c20dSDavid Ham ierr = MatCopy(bA->m[i][j],bB->m[i][j],str);CHKERRQ(ierr); 1041*2c71b3e2SJacob Faibussowitsch } else PetscCheckFalse(bA->m[i][j] || bB->m[i][j],PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %" PetscInt_FMT ",%" PetscInt_FMT,i,j); 104206a1af2fSStefano Zampini ierr = MatGetNonzeroState(bB->m[i][j],&subnnzstate);CHKERRQ(ierr); 104306a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || bB->nnzstate[i*nc+j] != subnnzstate); 104406a1af2fSStefano Zampini bB->nnzstate[i*nc+j] = subnnzstate; 1045c222c20dSDavid Ham } 1046c222c20dSDavid Ham } 104706a1af2fSStefano Zampini if (nnzstate) B->nonzerostate++; 1048c222c20dSDavid Ham PetscFunctionReturn(0); 1049c222c20dSDavid Ham } 1050c222c20dSDavid Ham 10516e76ffeaSPierre Jolivet static PetscErrorCode MatAXPY_Nest(Mat Y,PetscScalar a,Mat X,MatStructure str) 10526e76ffeaSPierre Jolivet { 10536e76ffeaSPierre Jolivet Mat_Nest *bY = (Mat_Nest*)Y->data,*bX = (Mat_Nest*)X->data; 10546e76ffeaSPierre Jolivet PetscInt i,j,nr = bY->nr,nc = bY->nc; 10556e76ffeaSPierre Jolivet PetscErrorCode ierr; 105606a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 10576e76ffeaSPierre Jolivet 10586e76ffeaSPierre Jolivet PetscFunctionBegin; 1059*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(nr != bX->nr || nc != bX->nc,PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Cannot AXPY a MatNest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ") with a MatNest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ")",bX->nr,bX->nc,nr,nc); 10606e76ffeaSPierre Jolivet for (i=0; i<nr; i++) { 10616e76ffeaSPierre Jolivet for (j=0; j<nc; j++) { 106206a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 10636e76ffeaSPierre Jolivet if (bY->m[i][j] && bX->m[i][j]) { 10646e76ffeaSPierre Jolivet ierr = MatAXPY(bY->m[i][j],a,bX->m[i][j],str);CHKERRQ(ierr); 1065c066aebcSStefano Zampini } else if (bX->m[i][j]) { 1066c066aebcSStefano Zampini Mat M; 1067c066aebcSStefano Zampini 1068*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(str != DIFFERENT_NONZERO_PATTERN,PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_INCOMP,"Matrix block does not exist at %" PetscInt_FMT ",%" PetscInt_FMT ". Use DIFFERENT_NONZERO_PATTERN",i,j); 1069c066aebcSStefano Zampini ierr = MatDuplicate(bX->m[i][j],MAT_COPY_VALUES,&M);CHKERRQ(ierr); 1070c066aebcSStefano Zampini ierr = MatNestSetSubMat(Y,i,j,M);CHKERRQ(ierr); 1071c066aebcSStefano Zampini ierr = MatDestroy(&M);CHKERRQ(ierr); 1072c066aebcSStefano Zampini } 1073060bfc19SStefano Zampini if (bY->m[i][j]) { ierr = MatGetNonzeroState(bY->m[i][j],&subnnzstate);CHKERRQ(ierr); } 107406a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || bY->nnzstate[i*nc+j] != subnnzstate); 107506a1af2fSStefano Zampini bY->nnzstate[i*nc+j] = subnnzstate; 10766e76ffeaSPierre Jolivet } 10776e76ffeaSPierre Jolivet } 107806a1af2fSStefano Zampini if (nnzstate) Y->nonzerostate++; 10796e76ffeaSPierre Jolivet PetscFunctionReturn(0); 10806e76ffeaSPierre Jolivet } 10816e76ffeaSPierre Jolivet 1082207556f9SJed Brown static PetscErrorCode MatDuplicate_Nest(Mat A,MatDuplicateOption op,Mat *B) 1083d8588912SDave May { 1084d8588912SDave May Mat_Nest *bA = (Mat_Nest*)A->data; 1085841e96a3SJed Brown Mat *b; 1086841e96a3SJed Brown PetscInt i,j,nr = bA->nr,nc = bA->nc; 1087d8588912SDave May PetscErrorCode ierr; 1088d8588912SDave May 1089d8588912SDave May PetscFunctionBegin; 1090785e854fSJed Brown ierr = PetscMalloc1(nr*nc,&b);CHKERRQ(ierr); 1091841e96a3SJed Brown for (i=0; i<nr; i++) { 1092841e96a3SJed Brown for (j=0; j<nc; j++) { 1093841e96a3SJed Brown if (bA->m[i][j]) { 1094841e96a3SJed Brown ierr = MatDuplicate(bA->m[i][j],op,&b[i*nc+j]);CHKERRQ(ierr); 1095841e96a3SJed Brown } else { 10960298fd71SBarry Smith b[i*nc+j] = NULL; 1097d8588912SDave May } 1098d8588912SDave May } 1099d8588912SDave May } 1100ce94432eSBarry Smith ierr = MatCreateNest(PetscObjectComm((PetscObject)A),nr,bA->isglobal.row,nc,bA->isglobal.col,b,B);CHKERRQ(ierr); 1101841e96a3SJed Brown /* Give the new MatNest exclusive ownership */ 1102841e96a3SJed Brown for (i=0; i<nr*nc; i++) { 11036bf464f9SBarry Smith ierr = MatDestroy(&b[i]);CHKERRQ(ierr); 1104d8588912SDave May } 1105d8588912SDave May ierr = PetscFree(b);CHKERRQ(ierr); 1106d8588912SDave May 1107841e96a3SJed Brown ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1108841e96a3SJed Brown ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1109d8588912SDave May PetscFunctionReturn(0); 1110d8588912SDave May } 1111d8588912SDave May 1112d8588912SDave May /* nest api */ 1113d8588912SDave May PetscErrorCode MatNestGetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat *mat) 1114d8588912SDave May { 1115d8588912SDave May Mat_Nest *bA = (Mat_Nest*)A->data; 11165fd66863SKarl Rupp 1117d8588912SDave May PetscFunctionBegin; 1118*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(idxm >= bA->nr,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT,idxm,bA->nr-1); 1119*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(jdxm >= bA->nc,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %" PetscInt_FMT " max %" PetscInt_FMT,jdxm,bA->nc-1); 1120d8588912SDave May *mat = bA->m[idxm][jdxm]; 1121d8588912SDave May PetscFunctionReturn(0); 1122d8588912SDave May } 1123d8588912SDave May 11249ba0d327SJed Brown /*@ 1125d8588912SDave May MatNestGetSubMat - Returns a single, sub-matrix from a nest matrix. 1126d8588912SDave May 1127d8588912SDave May Not collective 1128d8588912SDave May 1129d8588912SDave May Input Parameters: 1130629881c0SJed Brown + A - nest matrix 1131d8588912SDave May . idxm - index of the matrix within the nest matrix 1132629881c0SJed Brown - jdxm - index of the matrix within the nest matrix 1133d8588912SDave May 1134d8588912SDave May Output Parameter: 1135d8588912SDave May . sub - matrix at index idxm,jdxm within the nest matrix 1136d8588912SDave May 1137d8588912SDave May Level: developer 1138d8588912SDave May 1139bb97c47cSPierre Jolivet .seealso: MatNestGetSize(), MatNestGetSubMats(), MatCreateNest(), MATNEST, MatNestSetSubMat(), 114079798668SBarry Smith MatNestGetLocalISs(), MatNestGetISs() 1141d8588912SDave May @*/ 11427087cfbeSBarry Smith PetscErrorCode MatNestGetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat *sub) 1143d8588912SDave May { 1144699a902aSJed Brown PetscErrorCode ierr; 1145d8588912SDave May 1146d8588912SDave May PetscFunctionBegin; 1147699a902aSJed Brown ierr = PetscUseMethod(A,"MatNestGetSubMat_C",(Mat,PetscInt,PetscInt,Mat*),(A,idxm,jdxm,sub));CHKERRQ(ierr); 1148d8588912SDave May PetscFunctionReturn(0); 1149d8588912SDave May } 1150d8588912SDave May 11510782ca92SJed Brown PetscErrorCode MatNestSetSubMat_Nest(Mat A,PetscInt idxm,PetscInt jdxm,Mat mat) 11520782ca92SJed Brown { 11530782ca92SJed Brown Mat_Nest *bA = (Mat_Nest*)A->data; 11540782ca92SJed Brown PetscInt m,n,M,N,mi,ni,Mi,Ni; 11550782ca92SJed Brown PetscErrorCode ierr; 11560782ca92SJed Brown 11570782ca92SJed Brown PetscFunctionBegin; 1158*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(idxm >= bA->nr,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT,idxm,bA->nr-1); 1159*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(jdxm >= bA->nc,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Col too large: row %" PetscInt_FMT " max %" PetscInt_FMT,jdxm,bA->nc-1); 11600782ca92SJed Brown ierr = MatGetLocalSize(mat,&m,&n);CHKERRQ(ierr); 11610782ca92SJed Brown ierr = MatGetSize(mat,&M,&N);CHKERRQ(ierr); 11620782ca92SJed Brown ierr = ISGetLocalSize(bA->isglobal.row[idxm],&mi);CHKERRQ(ierr); 11630782ca92SJed Brown ierr = ISGetSize(bA->isglobal.row[idxm],&Mi);CHKERRQ(ierr); 11640782ca92SJed Brown ierr = ISGetLocalSize(bA->isglobal.col[jdxm],&ni);CHKERRQ(ierr); 11650782ca92SJed Brown ierr = ISGetSize(bA->isglobal.col[jdxm],&Ni);CHKERRQ(ierr); 1166*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(M != Mi || N != Ni,PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix dimension (%" PetscInt_FMT ",%" PetscInt_FMT ") incompatible with nest block (%" PetscInt_FMT ",%" PetscInt_FMT ")",M,N,Mi,Ni); 1167*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(m != mi || n != ni,PetscObjectComm((PetscObject)mat),PETSC_ERR_ARG_INCOMP,"Submatrix local dimension (%" PetscInt_FMT ",%" PetscInt_FMT ") incompatible with nest block (%" PetscInt_FMT ",%" PetscInt_FMT ")",m,n,mi,ni); 116826fbe8dcSKarl Rupp 116906a1af2fSStefano Zampini /* do not increase object state */ 117006a1af2fSStefano Zampini if (mat == bA->m[idxm][jdxm]) PetscFunctionReturn(0); 117106a1af2fSStefano Zampini 11720782ca92SJed Brown ierr = PetscObjectReference((PetscObject)mat);CHKERRQ(ierr); 11730782ca92SJed Brown ierr = MatDestroy(&bA->m[idxm][jdxm]);CHKERRQ(ierr); 11740782ca92SJed Brown bA->m[idxm][jdxm] = mat; 117506a1af2fSStefano Zampini ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr); 117606a1af2fSStefano Zampini ierr = MatGetNonzeroState(mat,&bA->nnzstate[idxm*bA->nc+jdxm]);CHKERRQ(ierr); 117706a1af2fSStefano Zampini A->nonzerostate++; 11780782ca92SJed Brown PetscFunctionReturn(0); 11790782ca92SJed Brown } 11800782ca92SJed Brown 11819ba0d327SJed Brown /*@ 11820782ca92SJed Brown MatNestSetSubMat - Set a single submatrix in the nest matrix. 11830782ca92SJed Brown 11840782ca92SJed Brown Logically collective on the submatrix communicator 11850782ca92SJed Brown 11860782ca92SJed Brown Input Parameters: 11870782ca92SJed Brown + A - nest matrix 11880782ca92SJed Brown . idxm - index of the matrix within the nest matrix 11890782ca92SJed Brown . jdxm - index of the matrix within the nest matrix 11900782ca92SJed Brown - sub - matrix at index idxm,jdxm within the nest matrix 11910782ca92SJed Brown 11920782ca92SJed Brown Notes: 11930782ca92SJed Brown The new submatrix must have the same size and communicator as that block of the nest. 11940782ca92SJed Brown 11950782ca92SJed Brown This increments the reference count of the submatrix. 11960782ca92SJed Brown 11970782ca92SJed Brown Level: developer 11980782ca92SJed Brown 1199bb97c47cSPierre Jolivet .seealso: MatNestSetSubMats(), MatNestGetSubMats(), MatNestGetLocalISs(), MATNEST, MatCreateNest(), 120079798668SBarry Smith MatNestGetSubMat(), MatNestGetISs(), MatNestGetSize() 12010782ca92SJed Brown @*/ 12020782ca92SJed Brown PetscErrorCode MatNestSetSubMat(Mat A,PetscInt idxm,PetscInt jdxm,Mat sub) 12030782ca92SJed Brown { 12040782ca92SJed Brown PetscErrorCode ierr; 12050782ca92SJed Brown 12060782ca92SJed Brown PetscFunctionBegin; 12070782ca92SJed Brown ierr = PetscUseMethod(A,"MatNestSetSubMat_C",(Mat,PetscInt,PetscInt,Mat),(A,idxm,jdxm,sub));CHKERRQ(ierr); 12080782ca92SJed Brown PetscFunctionReturn(0); 12090782ca92SJed Brown } 12100782ca92SJed Brown 1211d8588912SDave May PetscErrorCode MatNestGetSubMats_Nest(Mat A,PetscInt *M,PetscInt *N,Mat ***mat) 1212d8588912SDave May { 1213d8588912SDave May Mat_Nest *bA = (Mat_Nest*)A->data; 12145fd66863SKarl Rupp 1215d8588912SDave May PetscFunctionBegin; 121626fbe8dcSKarl Rupp if (M) *M = bA->nr; 121726fbe8dcSKarl Rupp if (N) *N = bA->nc; 121826fbe8dcSKarl Rupp if (mat) *mat = bA->m; 1219d8588912SDave May PetscFunctionReturn(0); 1220d8588912SDave May } 1221d8588912SDave May 1222d8588912SDave May /*@C 1223d8588912SDave May MatNestGetSubMats - Returns the entire two dimensional array of matrices defining a nest matrix. 1224d8588912SDave May 1225d8588912SDave May Not collective 1226d8588912SDave May 1227f899ff85SJose E. Roman Input Parameter: 1228629881c0SJed Brown . A - nest matrix 1229d8588912SDave May 1230d8d19677SJose E. Roman Output Parameters: 1231629881c0SJed Brown + M - number of rows in the nest matrix 1232d8588912SDave May . N - number of cols in the nest matrix 1233629881c0SJed Brown - mat - 2d array of matrices 1234d8588912SDave May 1235d8588912SDave May Notes: 1236d8588912SDave May 1237d8588912SDave May The user should not free the array mat. 1238d8588912SDave May 1239351962e3SVincent Le Chenadec In Fortran, this routine has a calling sequence 1240351962e3SVincent Le Chenadec $ call MatNestGetSubMats(A, M, N, mat, ierr) 1241351962e3SVincent Le Chenadec where the space allocated for the optional argument mat is assumed large enough (if provided). 1242351962e3SVincent Le Chenadec 1243d8588912SDave May Level: developer 1244d8588912SDave May 1245bb97c47cSPierre Jolivet .seealso: MatNestGetSize(), MatNestGetSubMat(), MatNestGetLocalISs(), MATNEST, MatCreateNest(), 124679798668SBarry Smith MatNestSetSubMats(), MatNestGetISs(), MatNestSetSubMat() 1247d8588912SDave May @*/ 12487087cfbeSBarry Smith PetscErrorCode MatNestGetSubMats(Mat A,PetscInt *M,PetscInt *N,Mat ***mat) 1249d8588912SDave May { 1250699a902aSJed Brown PetscErrorCode ierr; 1251d8588912SDave May 1252d8588912SDave May PetscFunctionBegin; 1253699a902aSJed Brown ierr = PetscUseMethod(A,"MatNestGetSubMats_C",(Mat,PetscInt*,PetscInt*,Mat***),(A,M,N,mat));CHKERRQ(ierr); 1254d8588912SDave May PetscFunctionReturn(0); 1255d8588912SDave May } 1256d8588912SDave May 12577087cfbeSBarry Smith PetscErrorCode MatNestGetSize_Nest(Mat A,PetscInt *M,PetscInt *N) 1258d8588912SDave May { 1259d8588912SDave May Mat_Nest *bA = (Mat_Nest*)A->data; 1260d8588912SDave May 1261d8588912SDave May PetscFunctionBegin; 126226fbe8dcSKarl Rupp if (M) *M = bA->nr; 126326fbe8dcSKarl Rupp if (N) *N = bA->nc; 1264d8588912SDave May PetscFunctionReturn(0); 1265d8588912SDave May } 1266d8588912SDave May 12679ba0d327SJed Brown /*@ 1268d8588912SDave May MatNestGetSize - Returns the size of the nest matrix. 1269d8588912SDave May 1270d8588912SDave May Not collective 1271d8588912SDave May 1272f899ff85SJose E. Roman Input Parameter: 1273d8588912SDave May . A - nest matrix 1274d8588912SDave May 1275d8d19677SJose E. Roman Output Parameters: 1276629881c0SJed Brown + M - number of rows in the nested mat 1277629881c0SJed Brown - N - number of cols in the nested mat 1278d8588912SDave May 1279d8588912SDave May Notes: 1280d8588912SDave May 1281d8588912SDave May Level: developer 1282d8588912SDave May 1283bb97c47cSPierre Jolivet .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MATNEST, MatCreateNest(), MatNestGetLocalISs(), 128479798668SBarry Smith MatNestGetISs() 1285d8588912SDave May @*/ 12867087cfbeSBarry Smith PetscErrorCode MatNestGetSize(Mat A,PetscInt *M,PetscInt *N) 1287d8588912SDave May { 1288699a902aSJed Brown PetscErrorCode ierr; 1289d8588912SDave May 1290d8588912SDave May PetscFunctionBegin; 1291699a902aSJed Brown ierr = PetscUseMethod(A,"MatNestGetSize_C",(Mat,PetscInt*,PetscInt*),(A,M,N));CHKERRQ(ierr); 1292d8588912SDave May PetscFunctionReturn(0); 1293d8588912SDave May } 1294d8588912SDave May 1295f7a08781SBarry Smith static PetscErrorCode MatNestGetISs_Nest(Mat A,IS rows[],IS cols[]) 1296900e7ff2SJed Brown { 1297900e7ff2SJed Brown Mat_Nest *vs = (Mat_Nest*)A->data; 1298900e7ff2SJed Brown PetscInt i; 1299900e7ff2SJed Brown 1300900e7ff2SJed Brown PetscFunctionBegin; 1301900e7ff2SJed Brown if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->isglobal.row[i]; 1302900e7ff2SJed Brown if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->isglobal.col[i]; 1303900e7ff2SJed Brown PetscFunctionReturn(0); 1304900e7ff2SJed Brown } 1305900e7ff2SJed Brown 13063a4d7b9aSSatish Balay /*@C 1307900e7ff2SJed Brown MatNestGetISs - Returns the index sets partitioning the row and column spaces 1308900e7ff2SJed Brown 1309900e7ff2SJed Brown Not collective 1310900e7ff2SJed Brown 1311f899ff85SJose E. Roman Input Parameter: 1312900e7ff2SJed Brown . A - nest matrix 1313900e7ff2SJed Brown 1314d8d19677SJose E. Roman Output Parameters: 1315900e7ff2SJed Brown + rows - array of row index sets 1316900e7ff2SJed Brown - cols - array of column index sets 1317900e7ff2SJed Brown 1318900e7ff2SJed Brown Level: advanced 1319900e7ff2SJed Brown 1320900e7ff2SJed Brown Notes: 1321900e7ff2SJed Brown The user must have allocated arrays of the correct size. The reference count is not increased on the returned ISs. 1322900e7ff2SJed Brown 132379798668SBarry Smith .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetLocalISs(), MATNEST, 1324bb97c47cSPierre Jolivet MatCreateNest(), MatNestGetSubMats(), MatNestSetSubMats() 1325900e7ff2SJed Brown @*/ 1326900e7ff2SJed Brown PetscErrorCode MatNestGetISs(Mat A,IS rows[],IS cols[]) 1327900e7ff2SJed Brown { 1328900e7ff2SJed Brown PetscErrorCode ierr; 1329900e7ff2SJed Brown 1330900e7ff2SJed Brown PetscFunctionBegin; 1331900e7ff2SJed Brown PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1332900e7ff2SJed Brown ierr = PetscUseMethod(A,"MatNestGetISs_C",(Mat,IS[],IS[]),(A,rows,cols));CHKERRQ(ierr); 1333900e7ff2SJed Brown PetscFunctionReturn(0); 1334900e7ff2SJed Brown } 1335900e7ff2SJed Brown 1336f7a08781SBarry Smith static PetscErrorCode MatNestGetLocalISs_Nest(Mat A,IS rows[],IS cols[]) 1337900e7ff2SJed Brown { 1338900e7ff2SJed Brown Mat_Nest *vs = (Mat_Nest*)A->data; 1339900e7ff2SJed Brown PetscInt i; 1340900e7ff2SJed Brown 1341900e7ff2SJed Brown PetscFunctionBegin; 1342900e7ff2SJed Brown if (rows) for (i=0; i<vs->nr; i++) rows[i] = vs->islocal.row[i]; 1343900e7ff2SJed Brown if (cols) for (i=0; i<vs->nc; i++) cols[i] = vs->islocal.col[i]; 1344900e7ff2SJed Brown PetscFunctionReturn(0); 1345900e7ff2SJed Brown } 1346900e7ff2SJed Brown 1347900e7ff2SJed Brown /*@C 1348900e7ff2SJed Brown MatNestGetLocalISs - Returns the index sets partitioning the row and column spaces 1349900e7ff2SJed Brown 1350900e7ff2SJed Brown Not collective 1351900e7ff2SJed Brown 1352f899ff85SJose E. Roman Input Parameter: 1353900e7ff2SJed Brown . A - nest matrix 1354900e7ff2SJed Brown 1355d8d19677SJose E. Roman Output Parameters: 13560298fd71SBarry Smith + rows - array of row index sets (or NULL to ignore) 13570298fd71SBarry Smith - cols - array of column index sets (or NULL to ignore) 1358900e7ff2SJed Brown 1359900e7ff2SJed Brown Level: advanced 1360900e7ff2SJed Brown 1361900e7ff2SJed Brown Notes: 1362900e7ff2SJed Brown The user must have allocated arrays of the correct size. The reference count is not increased on the returned ISs. 1363900e7ff2SJed Brown 1364bb97c47cSPierre Jolivet .seealso: MatNestGetSubMat(), MatNestGetSubMats(), MatNestGetSize(), MatNestGetISs(), MatCreateNest(), 136579798668SBarry Smith MATNEST, MatNestSetSubMats(), MatNestSetSubMat() 1366900e7ff2SJed Brown @*/ 1367900e7ff2SJed Brown PetscErrorCode MatNestGetLocalISs(Mat A,IS rows[],IS cols[]) 1368900e7ff2SJed Brown { 1369900e7ff2SJed Brown PetscErrorCode ierr; 1370900e7ff2SJed Brown 1371900e7ff2SJed Brown PetscFunctionBegin; 1372900e7ff2SJed Brown PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1373900e7ff2SJed Brown ierr = PetscUseMethod(A,"MatNestGetLocalISs_C",(Mat,IS[],IS[]),(A,rows,cols));CHKERRQ(ierr); 1374900e7ff2SJed Brown PetscFunctionReturn(0); 1375900e7ff2SJed Brown } 1376900e7ff2SJed Brown 137719fd82e9SBarry Smith PetscErrorCode MatNestSetVecType_Nest(Mat A,VecType vtype) 1378207556f9SJed Brown { 1379207556f9SJed Brown PetscErrorCode ierr; 1380207556f9SJed Brown PetscBool flg; 1381207556f9SJed Brown 1382207556f9SJed Brown PetscFunctionBegin; 1383207556f9SJed Brown ierr = PetscStrcmp(vtype,VECNEST,&flg);CHKERRQ(ierr); 1384207556f9SJed Brown /* In reality, this only distinguishes VECNEST and "other" */ 13852a7a6963SBarry Smith if (flg) A->ops->getvecs = MatCreateVecs_Nest; 138612b53f24SSatish Balay else A->ops->getvecs = (PetscErrorCode (*)(Mat,Vec*,Vec*)) 0; 1387207556f9SJed Brown PetscFunctionReturn(0); 1388207556f9SJed Brown } 1389207556f9SJed Brown 1390207556f9SJed Brown /*@C 13912a7a6963SBarry Smith MatNestSetVecType - Sets the type of Vec returned by MatCreateVecs() 1392207556f9SJed Brown 1393207556f9SJed Brown Not collective 1394207556f9SJed Brown 1395207556f9SJed Brown Input Parameters: 1396207556f9SJed Brown + A - nest matrix 1397207556f9SJed Brown - vtype - type to use for creating vectors 1398207556f9SJed Brown 1399207556f9SJed Brown Notes: 1400207556f9SJed Brown 1401207556f9SJed Brown Level: developer 1402207556f9SJed Brown 1403bb97c47cSPierre Jolivet .seealso: MatCreateVecs(), MATNEST, MatCreateNest() 1404207556f9SJed Brown @*/ 140519fd82e9SBarry Smith PetscErrorCode MatNestSetVecType(Mat A,VecType vtype) 1406207556f9SJed Brown { 1407207556f9SJed Brown PetscErrorCode ierr; 1408207556f9SJed Brown 1409207556f9SJed Brown PetscFunctionBegin; 141019fd82e9SBarry Smith ierr = PetscTryMethod(A,"MatNestSetVecType_C",(Mat,VecType),(A,vtype));CHKERRQ(ierr); 1411207556f9SJed Brown PetscFunctionReturn(0); 1412207556f9SJed Brown } 1413207556f9SJed Brown 1414c8883902SJed Brown PetscErrorCode MatNestSetSubMats_Nest(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[]) 1415d8588912SDave May { 1416c8883902SJed Brown Mat_Nest *s = (Mat_Nest*)A->data; 1417c8883902SJed Brown PetscInt i,j,m,n,M,N; 1418d8588912SDave May PetscErrorCode ierr; 141988ffe2e8SJose E. Roman PetscBool cong,isstd,sametype=PETSC_FALSE; 142088ffe2e8SJose E. Roman VecType vtype,type; 1421d8588912SDave May 1422d8588912SDave May PetscFunctionBegin; 142306a1af2fSStefano Zampini ierr = MatReset_Nest(A);CHKERRQ(ierr); 142406a1af2fSStefano Zampini 1425c8883902SJed Brown s->nr = nr; 1426c8883902SJed Brown s->nc = nc; 1427d8588912SDave May 1428c8883902SJed Brown /* Create space for submatrices */ 1429854ce69bSBarry Smith ierr = PetscMalloc1(nr,&s->m);CHKERRQ(ierr); 1430c8883902SJed Brown for (i=0; i<nr; i++) { 1431854ce69bSBarry Smith ierr = PetscMalloc1(nc,&s->m[i]);CHKERRQ(ierr); 1432d8588912SDave May } 1433c8883902SJed Brown for (i=0; i<nr; i++) { 1434c8883902SJed Brown for (j=0; j<nc; j++) { 1435c8883902SJed Brown s->m[i][j] = a[i*nc+j]; 1436c8883902SJed Brown if (a[i*nc+j]) { 1437c8883902SJed Brown ierr = PetscObjectReference((PetscObject)a[i*nc+j]);CHKERRQ(ierr); 1438d8588912SDave May } 1439d8588912SDave May } 1440d8588912SDave May } 144188ffe2e8SJose E. Roman ierr = MatGetVecType(A,&vtype);CHKERRQ(ierr); 144288ffe2e8SJose E. Roman ierr = PetscStrcmp(vtype,VECSTANDARD,&isstd);CHKERRQ(ierr); 144388ffe2e8SJose E. Roman if (isstd) { 144488ffe2e8SJose E. Roman /* check if all blocks have the same vectype */ 144588ffe2e8SJose E. Roman vtype = NULL; 144688ffe2e8SJose E. Roman for (i=0; i<nr; i++) { 144788ffe2e8SJose E. Roman for (j=0; j<nc; j++) { 144888ffe2e8SJose E. Roman if (a[i*nc+j]) { 144988ffe2e8SJose E. Roman if (!vtype) { /* first visited block */ 145088ffe2e8SJose E. Roman ierr = MatGetVecType(a[i*nc+j],&vtype);CHKERRQ(ierr); 145188ffe2e8SJose E. Roman sametype = PETSC_TRUE; 145288ffe2e8SJose E. Roman } else if (sametype) { 145388ffe2e8SJose E. Roman ierr = MatGetVecType(a[i*nc+j],&type);CHKERRQ(ierr); 145488ffe2e8SJose E. Roman ierr = PetscStrcmp(vtype,type,&sametype);CHKERRQ(ierr); 145588ffe2e8SJose E. Roman } 145688ffe2e8SJose E. Roman } 145788ffe2e8SJose E. Roman } 145888ffe2e8SJose E. Roman } 145988ffe2e8SJose E. Roman if (sametype) { /* propagate vectype */ 146088ffe2e8SJose E. Roman ierr = MatSetVecType(A,vtype);CHKERRQ(ierr); 146188ffe2e8SJose E. Roman } 146288ffe2e8SJose E. Roman } 1463d8588912SDave May 14648188e55aSJed Brown ierr = MatSetUp_NestIS_Private(A,nr,is_row,nc,is_col);CHKERRQ(ierr); 1465d8588912SDave May 1466854ce69bSBarry Smith ierr = PetscMalloc1(nr,&s->row_len);CHKERRQ(ierr); 1467854ce69bSBarry Smith ierr = PetscMalloc1(nc,&s->col_len);CHKERRQ(ierr); 1468c8883902SJed Brown for (i=0; i<nr; i++) s->row_len[i]=-1; 1469c8883902SJed Brown for (j=0; j<nc; j++) s->col_len[j]=-1; 1470d8588912SDave May 147106a1af2fSStefano Zampini ierr = PetscCalloc1(nr*nc,&s->nnzstate);CHKERRQ(ierr); 147206a1af2fSStefano Zampini for (i=0; i<nr; i++) { 147306a1af2fSStefano Zampini for (j=0; j<nc; j++) { 147406a1af2fSStefano Zampini if (s->m[i][j]) { 147506a1af2fSStefano Zampini ierr = MatGetNonzeroState(s->m[i][j],&s->nnzstate[i*nc+j]);CHKERRQ(ierr); 147606a1af2fSStefano Zampini } 147706a1af2fSStefano Zampini } 147806a1af2fSStefano Zampini } 147906a1af2fSStefano Zampini 14808188e55aSJed Brown ierr = MatNestGetSizes_Private(A,&m,&n,&M,&N);CHKERRQ(ierr); 1481d8588912SDave May 1482c8883902SJed Brown ierr = PetscLayoutSetSize(A->rmap,M);CHKERRQ(ierr); 1483c8883902SJed Brown ierr = PetscLayoutSetLocalSize(A->rmap,m);CHKERRQ(ierr); 1484c8883902SJed Brown ierr = PetscLayoutSetSize(A->cmap,N);CHKERRQ(ierr); 1485c8883902SJed Brown ierr = PetscLayoutSetLocalSize(A->cmap,n);CHKERRQ(ierr); 1486c8883902SJed Brown 1487c8883902SJed Brown ierr = PetscLayoutSetUp(A->rmap);CHKERRQ(ierr); 1488c8883902SJed Brown ierr = PetscLayoutSetUp(A->cmap);CHKERRQ(ierr); 1489c8883902SJed Brown 149006a1af2fSStefano Zampini /* disable operations that are not supported for non-square matrices, 149106a1af2fSStefano Zampini or matrices for which is_row != is_col */ 149206a1af2fSStefano Zampini ierr = MatHasCongruentLayouts(A,&cong);CHKERRQ(ierr); 149306a1af2fSStefano Zampini if (cong && nr != nc) cong = PETSC_FALSE; 149406a1af2fSStefano Zampini if (cong) { 149506a1af2fSStefano Zampini for (i = 0; cong && i < nr; i++) { 1496320466b0SStefano Zampini ierr = ISEqualUnsorted(s->isglobal.row[i],s->isglobal.col[i],&cong);CHKERRQ(ierr); 149706a1af2fSStefano Zampini } 149806a1af2fSStefano Zampini } 149906a1af2fSStefano Zampini if (!cong) { 1500381b8e50SStefano Zampini A->ops->missingdiagonal = NULL; 150106a1af2fSStefano Zampini A->ops->getdiagonal = NULL; 150206a1af2fSStefano Zampini A->ops->shift = NULL; 150306a1af2fSStefano Zampini A->ops->diagonalset = NULL; 150406a1af2fSStefano Zampini } 150506a1af2fSStefano Zampini 15061795a4d1SJed Brown ierr = PetscCalloc2(nr,&s->left,nc,&s->right);CHKERRQ(ierr); 150706a1af2fSStefano Zampini ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr); 150806a1af2fSStefano Zampini A->nonzerostate++; 1509d8588912SDave May PetscFunctionReturn(0); 1510d8588912SDave May } 1511d8588912SDave May 1512c8883902SJed Brown /*@ 1513c8883902SJed Brown MatNestSetSubMats - Sets the nested submatrices 1514c8883902SJed Brown 1515c8883902SJed Brown Collective on Mat 1516c8883902SJed Brown 1517d8d19677SJose E. Roman Input Parameters: 1518ffd6319bSRichard Tran Mills + A - nested matrix 1519c8883902SJed Brown . nr - number of nested row blocks 15200298fd71SBarry Smith . is_row - index sets for each nested row block, or NULL to make contiguous 1521c8883902SJed Brown . nc - number of nested column blocks 15220298fd71SBarry Smith . is_col - index sets for each nested column block, or NULL to make contiguous 15230298fd71SBarry Smith - a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL 1524c8883902SJed Brown 152506a1af2fSStefano Zampini Notes: this always resets any submatrix information previously set 152606a1af2fSStefano Zampini 1527c8883902SJed Brown Level: advanced 1528c8883902SJed Brown 152979798668SBarry Smith .seealso: MatCreateNest(), MATNEST, MatNestSetSubMat(), MatNestGetSubMat(), MatNestGetSubMats() 1530c8883902SJed Brown @*/ 1531c8883902SJed Brown PetscErrorCode MatNestSetSubMats(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[]) 1532c8883902SJed Brown { 1533c8883902SJed Brown PetscErrorCode ierr; 153406a1af2fSStefano Zampini PetscInt i; 1535c8883902SJed Brown 1536c8883902SJed Brown PetscFunctionBegin; 1537c8883902SJed Brown PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1538*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(nr < 0,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of rows cannot be negative"); 1539c8883902SJed Brown if (nr && is_row) { 1540c8883902SJed Brown PetscValidPointer(is_row,3); 1541c8883902SJed Brown for (i=0; i<nr; i++) PetscValidHeaderSpecific(is_row[i],IS_CLASSID,3); 1542c8883902SJed Brown } 1543*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(nc < 0,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Number of columns cannot be negative"); 15441664e352SJed Brown if (nc && is_col) { 1545c8883902SJed Brown PetscValidPointer(is_col,5); 15469b30a8f6SBarry Smith for (i=0; i<nc; i++) PetscValidHeaderSpecific(is_col[i],IS_CLASSID,5); 1547c8883902SJed Brown } 154806a1af2fSStefano Zampini if (nr*nc > 0) PetscValidPointer(a,6); 1549c8883902SJed Brown ierr = PetscUseMethod(A,"MatNestSetSubMats_C",(Mat,PetscInt,const IS[],PetscInt,const IS[],const Mat[]),(A,nr,is_row,nc,is_col,a));CHKERRQ(ierr); 1550c8883902SJed Brown PetscFunctionReturn(0); 1551c8883902SJed Brown } 1552d8588912SDave May 155345b6f7e9SBarry Smith static PetscErrorCode MatNestCreateAggregateL2G_Private(Mat A,PetscInt n,const IS islocal[],const IS isglobal[],PetscBool colflg,ISLocalToGlobalMapping *ltog) 155477019fcaSJed Brown { 155577019fcaSJed Brown PetscErrorCode ierr; 155677019fcaSJed Brown PetscBool flg; 155777019fcaSJed Brown PetscInt i,j,m,mi,*ix; 155877019fcaSJed Brown 155977019fcaSJed Brown PetscFunctionBegin; 1560aea6d515SStefano Zampini *ltog = NULL; 156177019fcaSJed Brown for (i=0,m=0,flg=PETSC_FALSE; i<n; i++) { 156277019fcaSJed Brown if (islocal[i]) { 1563aea6d515SStefano Zampini ierr = ISGetLocalSize(islocal[i],&mi);CHKERRQ(ierr); 156477019fcaSJed Brown flg = PETSC_TRUE; /* We found a non-trivial entry */ 156577019fcaSJed Brown } else { 1566aea6d515SStefano Zampini ierr = ISGetLocalSize(isglobal[i],&mi);CHKERRQ(ierr); 156777019fcaSJed Brown } 156877019fcaSJed Brown m += mi; 156977019fcaSJed Brown } 1570aea6d515SStefano Zampini if (!flg) PetscFunctionReturn(0); 1571aea6d515SStefano Zampini 1572785e854fSJed Brown ierr = PetscMalloc1(m,&ix);CHKERRQ(ierr); 1573165cd838SBarry Smith for (i=0,m=0; i<n; i++) { 15740298fd71SBarry Smith ISLocalToGlobalMapping smap = NULL; 1575e108cb99SStefano Zampini Mat sub = NULL; 1576f6d38dbbSStefano Zampini PetscSF sf; 1577f6d38dbbSStefano Zampini PetscLayout map; 1578aea6d515SStefano Zampini const PetscInt *ix2; 157977019fcaSJed Brown 1580165cd838SBarry Smith if (!colflg) { 158177019fcaSJed Brown ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr); 158277019fcaSJed Brown } else { 158377019fcaSJed Brown ierr = MatNestFindNonzeroSubMatCol(A,i,&sub);CHKERRQ(ierr); 158477019fcaSJed Brown } 1585191fd14bSBarry Smith if (sub) { 1586191fd14bSBarry Smith if (!colflg) { 1587191fd14bSBarry Smith ierr = MatGetLocalToGlobalMapping(sub,&smap,NULL);CHKERRQ(ierr); 1588191fd14bSBarry Smith } else { 1589191fd14bSBarry Smith ierr = MatGetLocalToGlobalMapping(sub,NULL,&smap);CHKERRQ(ierr); 1590191fd14bSBarry Smith } 1591191fd14bSBarry Smith } 159277019fcaSJed Brown /* 159377019fcaSJed Brown Now we need to extract the monolithic global indices that correspond to the given split global indices. 159477019fcaSJed Brown In many/most cases, we only want MatGetLocalSubMatrix() to work, in which case we only need to know the size of the local spaces. 159577019fcaSJed Brown */ 1596aea6d515SStefano Zampini ierr = ISGetIndices(isglobal[i],&ix2);CHKERRQ(ierr); 1597aea6d515SStefano Zampini if (islocal[i]) { 1598aea6d515SStefano Zampini PetscInt *ilocal,*iremote; 1599aea6d515SStefano Zampini PetscInt mil,nleaves; 1600aea6d515SStefano Zampini 1601aea6d515SStefano Zampini ierr = ISGetLocalSize(islocal[i],&mi);CHKERRQ(ierr); 1602*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(!smap,PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"Missing local to global map"); 1603aea6d515SStefano Zampini for (j=0; j<mi; j++) ix[m+j] = j; 1604aea6d515SStefano Zampini ierr = ISLocalToGlobalMappingApply(smap,mi,ix+m,ix+m);CHKERRQ(ierr); 1605aea6d515SStefano Zampini 1606aea6d515SStefano Zampini /* PetscSFSetGraphLayout does not like negative indices */ 1607aea6d515SStefano Zampini ierr = PetscMalloc2(mi,&ilocal,mi,&iremote);CHKERRQ(ierr); 1608aea6d515SStefano Zampini for (j=0, nleaves = 0; j<mi; j++) { 1609aea6d515SStefano Zampini if (ix[m+j] < 0) continue; 1610aea6d515SStefano Zampini ilocal[nleaves] = j; 1611aea6d515SStefano Zampini iremote[nleaves] = ix[m+j]; 1612aea6d515SStefano Zampini nleaves++; 1613aea6d515SStefano Zampini } 1614aea6d515SStefano Zampini ierr = ISGetLocalSize(isglobal[i],&mil);CHKERRQ(ierr); 1615aea6d515SStefano Zampini ierr = PetscSFCreate(PetscObjectComm((PetscObject)A),&sf);CHKERRQ(ierr); 1616aea6d515SStefano Zampini ierr = PetscLayoutCreate(PetscObjectComm((PetscObject)A),&map);CHKERRQ(ierr); 1617aea6d515SStefano Zampini ierr = PetscLayoutSetLocalSize(map,mil);CHKERRQ(ierr); 1618f6d38dbbSStefano Zampini ierr = PetscLayoutSetUp(map);CHKERRQ(ierr); 1619aea6d515SStefano Zampini ierr = PetscSFSetGraphLayout(sf,map,nleaves,ilocal,PETSC_USE_POINTER,iremote);CHKERRQ(ierr); 1620f6d38dbbSStefano Zampini ierr = PetscLayoutDestroy(&map);CHKERRQ(ierr); 1621ad227feaSJunchao Zhang ierr = PetscSFBcastBegin(sf,MPIU_INT,ix2,ix + m,MPI_REPLACE);CHKERRQ(ierr); 1622ad227feaSJunchao Zhang ierr = PetscSFBcastEnd(sf,MPIU_INT,ix2,ix + m,MPI_REPLACE);CHKERRQ(ierr); 1623f6d38dbbSStefano Zampini ierr = PetscSFDestroy(&sf);CHKERRQ(ierr); 1624aea6d515SStefano Zampini ierr = PetscFree2(ilocal,iremote);CHKERRQ(ierr); 1625aea6d515SStefano Zampini } else { 1626aea6d515SStefano Zampini ierr = ISGetLocalSize(isglobal[i],&mi);CHKERRQ(ierr); 1627aea6d515SStefano Zampini for (j=0; j<mi; j++) ix[m+j] = ix2[i]; 1628aea6d515SStefano Zampini } 1629aea6d515SStefano Zampini ierr = ISRestoreIndices(isglobal[i],&ix2);CHKERRQ(ierr); 163077019fcaSJed Brown m += mi; 163177019fcaSJed Brown } 1632f0413b6fSBarry Smith ierr = ISLocalToGlobalMappingCreate(PetscObjectComm((PetscObject)A),1,m,ix,PETSC_OWN_POINTER,ltog);CHKERRQ(ierr); 163377019fcaSJed Brown PetscFunctionReturn(0); 163477019fcaSJed Brown } 163577019fcaSJed Brown 1636d8588912SDave May /* If an IS was provided, there is nothing Nest needs to do, otherwise Nest will build a strided IS */ 1637d8588912SDave May /* 1638d8588912SDave May nprocessors = NP 1639d8588912SDave May Nest x^T = ((g_0,g_1,...g_nprocs-1), (h_0,h_1,...h_NP-1)) 1640d8588912SDave May proc 0: => (g_0,h_0,) 1641d8588912SDave May proc 1: => (g_1,h_1,) 1642d8588912SDave May ... 1643d8588912SDave May proc nprocs-1: => (g_NP-1,h_NP-1,) 1644d8588912SDave May 1645d8588912SDave May proc 0: proc 1: proc nprocs-1: 1646d8588912SDave May is[0] = (0,1,2,...,nlocal(g_0)-1) (0,1,...,nlocal(g_1)-1) (0,1,...,nlocal(g_NP-1)) 1647d8588912SDave May 1648d8588912SDave May proc 0: 1649d8588912SDave May is[1] = (nlocal(g_0),nlocal(g_0)+1,...,nlocal(g_0)+nlocal(h_0)-1) 1650d8588912SDave May proc 1: 1651d8588912SDave May is[1] = (nlocal(g_1),nlocal(g_1)+1,...,nlocal(g_1)+nlocal(h_1)-1) 1652d8588912SDave May 1653d8588912SDave May proc NP-1: 1654d8588912SDave May is[1] = (nlocal(g_NP-1),nlocal(g_NP-1)+1,...,nlocal(g_NP-1)+nlocal(h_NP-1)-1) 1655d8588912SDave May */ 1656841e96a3SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat A,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[]) 1657d8588912SDave May { 1658e2d7f03fSJed Brown Mat_Nest *vs = (Mat_Nest*)A->data; 16598188e55aSJed Brown PetscInt i,j,offset,n,nsum,bs; 1660d8588912SDave May PetscErrorCode ierr; 16610298fd71SBarry Smith Mat sub = NULL; 1662d8588912SDave May 1663d8588912SDave May PetscFunctionBegin; 1664854ce69bSBarry Smith ierr = PetscMalloc1(nr,&vs->isglobal.row);CHKERRQ(ierr); 1665854ce69bSBarry Smith ierr = PetscMalloc1(nc,&vs->isglobal.col);CHKERRQ(ierr); 1666d8588912SDave May if (is_row) { /* valid IS is passed in */ 1667a5b23f4aSJose E. Roman /* refs on is[] are incremented */ 1668e2d7f03fSJed Brown for (i=0; i<vs->nr; i++) { 1669d8588912SDave May ierr = PetscObjectReference((PetscObject)is_row[i]);CHKERRQ(ierr); 167026fbe8dcSKarl Rupp 1671e2d7f03fSJed Brown vs->isglobal.row[i] = is_row[i]; 1672d8588912SDave May } 16732ae74bdbSJed Brown } else { /* Create the ISs by inspecting sizes of a submatrix in each row */ 16748188e55aSJed Brown nsum = 0; 16758188e55aSJed Brown for (i=0; i<vs->nr; i++) { /* Add up the local sizes to compute the aggregate offset */ 16768188e55aSJed Brown ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr); 1677*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(!sub,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in row %" PetscInt_FMT,i); 16780298fd71SBarry Smith ierr = MatGetLocalSize(sub,&n,NULL);CHKERRQ(ierr); 1679*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(n < 0,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix"); 16808188e55aSJed Brown nsum += n; 16818188e55aSJed Brown } 168255b25c41SPierre Jolivet ierr = MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A));CHKERRMPI(ierr); 168330bc264bSJed Brown offset -= nsum; 1684e2d7f03fSJed Brown for (i=0; i<vs->nr; i++) { 1685f349c1fdSJed Brown ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr); 16860298fd71SBarry Smith ierr = MatGetLocalSize(sub,&n,NULL);CHKERRQ(ierr); 168773b6653fSLawrence Mitchell ierr = MatGetBlockSizes(sub,&bs,NULL);CHKERRQ(ierr); 1688ce94432eSBarry Smith ierr = ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.row[i]);CHKERRQ(ierr); 1689e2d7f03fSJed Brown ierr = ISSetBlockSize(vs->isglobal.row[i],bs);CHKERRQ(ierr); 16902ae74bdbSJed Brown offset += n; 1691d8588912SDave May } 1692d8588912SDave May } 1693d8588912SDave May 1694d8588912SDave May if (is_col) { /* valid IS is passed in */ 1695a5b23f4aSJose E. Roman /* refs on is[] are incremented */ 1696e2d7f03fSJed Brown for (j=0; j<vs->nc; j++) { 1697d8588912SDave May ierr = PetscObjectReference((PetscObject)is_col[j]);CHKERRQ(ierr); 169826fbe8dcSKarl Rupp 1699e2d7f03fSJed Brown vs->isglobal.col[j] = is_col[j]; 1700d8588912SDave May } 17012ae74bdbSJed Brown } else { /* Create the ISs by inspecting sizes of a submatrix in each column */ 17022ae74bdbSJed Brown offset = A->cmap->rstart; 17038188e55aSJed Brown nsum = 0; 17048188e55aSJed Brown for (j=0; j<vs->nc; j++) { 17058188e55aSJed Brown ierr = MatNestFindNonzeroSubMatCol(A,j,&sub);CHKERRQ(ierr); 1706*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(!sub,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"No nonzero submatrix in column %" PetscInt_FMT,i); 17070298fd71SBarry Smith ierr = MatGetLocalSize(sub,NULL,&n);CHKERRQ(ierr); 1708*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(n < 0,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONGSTATE,"Sizes have not yet been set for submatrix"); 17098188e55aSJed Brown nsum += n; 17108188e55aSJed Brown } 171155b25c41SPierre Jolivet ierr = MPI_Scan(&nsum,&offset,1,MPIU_INT,MPI_SUM,PetscObjectComm((PetscObject)A));CHKERRMPI(ierr); 171230bc264bSJed Brown offset -= nsum; 1713e2d7f03fSJed Brown for (j=0; j<vs->nc; j++) { 1714f349c1fdSJed Brown ierr = MatNestFindNonzeroSubMatCol(A,j,&sub);CHKERRQ(ierr); 17150298fd71SBarry Smith ierr = MatGetLocalSize(sub,NULL,&n);CHKERRQ(ierr); 171673b6653fSLawrence Mitchell ierr = MatGetBlockSizes(sub,NULL,&bs);CHKERRQ(ierr); 1717ce94432eSBarry Smith ierr = ISCreateStride(PetscObjectComm((PetscObject)sub),n,offset,1,&vs->isglobal.col[j]);CHKERRQ(ierr); 1718e2d7f03fSJed Brown ierr = ISSetBlockSize(vs->isglobal.col[j],bs);CHKERRQ(ierr); 17192ae74bdbSJed Brown offset += n; 1720d8588912SDave May } 1721d8588912SDave May } 1722e2d7f03fSJed Brown 1723e2d7f03fSJed Brown /* Set up the local ISs */ 1724785e854fSJed Brown ierr = PetscMalloc1(vs->nr,&vs->islocal.row);CHKERRQ(ierr); 1725785e854fSJed Brown ierr = PetscMalloc1(vs->nc,&vs->islocal.col);CHKERRQ(ierr); 1726e2d7f03fSJed Brown for (i=0,offset=0; i<vs->nr; i++) { 1727e2d7f03fSJed Brown IS isloc; 17280298fd71SBarry Smith ISLocalToGlobalMapping rmap = NULL; 1729e2d7f03fSJed Brown PetscInt nlocal,bs; 1730e2d7f03fSJed Brown ierr = MatNestFindNonzeroSubMatRow(A,i,&sub);CHKERRQ(ierr); 17310298fd71SBarry Smith if (sub) {ierr = MatGetLocalToGlobalMapping(sub,&rmap,NULL);CHKERRQ(ierr);} 1732207556f9SJed Brown if (rmap) { 173373b6653fSLawrence Mitchell ierr = MatGetBlockSizes(sub,&bs,NULL);CHKERRQ(ierr); 1734e2d7f03fSJed Brown ierr = ISLocalToGlobalMappingGetSize(rmap,&nlocal);CHKERRQ(ierr); 1735e2d7f03fSJed Brown ierr = ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc);CHKERRQ(ierr); 1736e2d7f03fSJed Brown ierr = ISSetBlockSize(isloc,bs);CHKERRQ(ierr); 1737207556f9SJed Brown } else { 1738207556f9SJed Brown nlocal = 0; 17390298fd71SBarry Smith isloc = NULL; 1740207556f9SJed Brown } 1741e2d7f03fSJed Brown vs->islocal.row[i] = isloc; 1742e2d7f03fSJed Brown offset += nlocal; 1743e2d7f03fSJed Brown } 17448188e55aSJed Brown for (i=0,offset=0; i<vs->nc; i++) { 1745e2d7f03fSJed Brown IS isloc; 17460298fd71SBarry Smith ISLocalToGlobalMapping cmap = NULL; 1747e2d7f03fSJed Brown PetscInt nlocal,bs; 1748e2d7f03fSJed Brown ierr = MatNestFindNonzeroSubMatCol(A,i,&sub);CHKERRQ(ierr); 17490298fd71SBarry Smith if (sub) {ierr = MatGetLocalToGlobalMapping(sub,NULL,&cmap);CHKERRQ(ierr);} 1750207556f9SJed Brown if (cmap) { 175173b6653fSLawrence Mitchell ierr = MatGetBlockSizes(sub,NULL,&bs);CHKERRQ(ierr); 1752e2d7f03fSJed Brown ierr = ISLocalToGlobalMappingGetSize(cmap,&nlocal);CHKERRQ(ierr); 1753e2d7f03fSJed Brown ierr = ISCreateStride(PETSC_COMM_SELF,nlocal,offset,1,&isloc);CHKERRQ(ierr); 1754e2d7f03fSJed Brown ierr = ISSetBlockSize(isloc,bs);CHKERRQ(ierr); 1755207556f9SJed Brown } else { 1756207556f9SJed Brown nlocal = 0; 17570298fd71SBarry Smith isloc = NULL; 1758207556f9SJed Brown } 1759e2d7f03fSJed Brown vs->islocal.col[i] = isloc; 1760e2d7f03fSJed Brown offset += nlocal; 1761e2d7f03fSJed Brown } 17620189643fSJed Brown 176377019fcaSJed Brown /* Set up the aggregate ISLocalToGlobalMapping */ 176477019fcaSJed Brown { 176545b6f7e9SBarry Smith ISLocalToGlobalMapping rmap,cmap; 176645b6f7e9SBarry Smith ierr = MatNestCreateAggregateL2G_Private(A,vs->nr,vs->islocal.row,vs->isglobal.row,PETSC_FALSE,&rmap);CHKERRQ(ierr); 176745b6f7e9SBarry Smith ierr = MatNestCreateAggregateL2G_Private(A,vs->nc,vs->islocal.col,vs->isglobal.col,PETSC_TRUE,&cmap);CHKERRQ(ierr); 176877019fcaSJed Brown if (rmap && cmap) {ierr = MatSetLocalToGlobalMapping(A,rmap,cmap);CHKERRQ(ierr);} 176977019fcaSJed Brown ierr = ISLocalToGlobalMappingDestroy(&rmap);CHKERRQ(ierr); 177077019fcaSJed Brown ierr = ISLocalToGlobalMappingDestroy(&cmap);CHKERRQ(ierr); 177177019fcaSJed Brown } 177277019fcaSJed Brown 177376bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 17740189643fSJed Brown for (i=0; i<vs->nr; i++) { 17750189643fSJed Brown for (j=0; j<vs->nc; j++) { 17760189643fSJed Brown PetscInt m,n,M,N,mi,ni,Mi,Ni; 17770189643fSJed Brown Mat B = vs->m[i][j]; 17780189643fSJed Brown if (!B) continue; 17790189643fSJed Brown ierr = MatGetSize(B,&M,&N);CHKERRQ(ierr); 17800189643fSJed Brown ierr = MatGetLocalSize(B,&m,&n);CHKERRQ(ierr); 17810189643fSJed Brown ierr = ISGetSize(vs->isglobal.row[i],&Mi);CHKERRQ(ierr); 17820189643fSJed Brown ierr = ISGetSize(vs->isglobal.col[j],&Ni);CHKERRQ(ierr); 17830189643fSJed Brown ierr = ISGetLocalSize(vs->isglobal.row[i],&mi);CHKERRQ(ierr); 17840189643fSJed Brown ierr = ISGetLocalSize(vs->isglobal.col[j],&ni);CHKERRQ(ierr); 1785*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(M != Mi || N != Ni,PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Global sizes (%" PetscInt_FMT ",%" PetscInt_FMT ") of nested submatrix (%" PetscInt_FMT ",%" PetscInt_FMT ") do not agree with space defined by index sets (%" PetscInt_FMT ",%" PetscInt_FMT ")",M,N,i,j,Mi,Ni); 1786*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(m != mi || n != ni,PetscObjectComm((PetscObject)sub),PETSC_ERR_ARG_INCOMP,"Local sizes (%" PetscInt_FMT ",%" PetscInt_FMT ") of nested submatrix (%" PetscInt_FMT ",%" PetscInt_FMT ") do not agree with space defined by index sets (%" PetscInt_FMT ",%" PetscInt_FMT ")",m,n,i,j,mi,ni); 17870189643fSJed Brown } 17880189643fSJed Brown } 178976bd3646SJed Brown } 1790a061e289SJed Brown 1791a061e289SJed Brown /* Set A->assembled if all non-null blocks are currently assembled */ 1792a061e289SJed Brown for (i=0; i<vs->nr; i++) { 1793a061e289SJed Brown for (j=0; j<vs->nc; j++) { 1794a061e289SJed Brown if (vs->m[i][j] && !vs->m[i][j]->assembled) PetscFunctionReturn(0); 1795a061e289SJed Brown } 1796a061e289SJed Brown } 1797a061e289SJed Brown A->assembled = PETSC_TRUE; 1798d8588912SDave May PetscFunctionReturn(0); 1799d8588912SDave May } 1800d8588912SDave May 180145c38901SJed Brown /*@C 1802659c6bb0SJed Brown MatCreateNest - Creates a new matrix containing several nested submatrices, each stored separately 1803659c6bb0SJed Brown 1804659c6bb0SJed Brown Collective on Mat 1805659c6bb0SJed Brown 1806d8d19677SJose E. Roman Input Parameters: 1807659c6bb0SJed Brown + comm - Communicator for the new Mat 1808659c6bb0SJed Brown . nr - number of nested row blocks 18090298fd71SBarry Smith . is_row - index sets for each nested row block, or NULL to make contiguous 1810659c6bb0SJed Brown . nc - number of nested column blocks 18110298fd71SBarry Smith . is_col - index sets for each nested column block, or NULL to make contiguous 18120298fd71SBarry Smith - a - row-aligned array of nr*nc submatrices, empty submatrices can be passed using NULL 1813659c6bb0SJed Brown 1814659c6bb0SJed Brown Output Parameter: 1815659c6bb0SJed Brown . B - new matrix 1816659c6bb0SJed Brown 1817659c6bb0SJed Brown Level: advanced 1818659c6bb0SJed Brown 181979798668SBarry Smith .seealso: MatCreate(), VecCreateNest(), DMCreateMatrix(), MATNEST, MatNestSetSubMat(), 182079798668SBarry Smith MatNestGetSubMat(), MatNestGetLocalISs(), MatNestGetSize(), 182179798668SBarry Smith MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats() 1822659c6bb0SJed Brown @*/ 18237087cfbeSBarry Smith PetscErrorCode MatCreateNest(MPI_Comm comm,PetscInt nr,const IS is_row[],PetscInt nc,const IS is_col[],const Mat a[],Mat *B) 1824d8588912SDave May { 1825d8588912SDave May Mat A; 1826d8588912SDave May PetscErrorCode ierr; 1827d8588912SDave May 1828d8588912SDave May PetscFunctionBegin; 1829f4259b30SLisandro Dalcin *B = NULL; 1830d8588912SDave May ierr = MatCreate(comm,&A);CHKERRQ(ierr); 1831c8883902SJed Brown ierr = MatSetType(A,MATNEST);CHKERRQ(ierr); 183291a28eb3SBarry Smith A->preallocated = PETSC_TRUE; 1833c8883902SJed Brown ierr = MatNestSetSubMats(A,nr,is_row,nc,is_col,a);CHKERRQ(ierr); 1834d8588912SDave May *B = A; 1835d8588912SDave May PetscFunctionReturn(0); 1836d8588912SDave May } 1837659c6bb0SJed Brown 1838be705e3aSPierre Jolivet PetscErrorCode MatConvert_Nest_SeqAIJ_fast(Mat A,MatType newtype,MatReuse reuse,Mat *newmat) 1839b68353e5Sstefano_zampini { 1840b68353e5Sstefano_zampini Mat_Nest *nest = (Mat_Nest*)A->data; 184123875855Sstefano_zampini Mat *trans; 1842b68353e5Sstefano_zampini PetscScalar **avv; 1843b68353e5Sstefano_zampini PetscScalar *vv; 1844b68353e5Sstefano_zampini PetscInt **aii,**ajj; 1845b68353e5Sstefano_zampini PetscInt *ii,*jj,*ci; 1846b68353e5Sstefano_zampini PetscInt nr,nc,nnz,i,j; 1847b68353e5Sstefano_zampini PetscBool done; 1848b68353e5Sstefano_zampini PetscErrorCode ierr; 1849b68353e5Sstefano_zampini 1850b68353e5Sstefano_zampini PetscFunctionBegin; 1851b68353e5Sstefano_zampini ierr = MatGetSize(A,&nr,&nc);CHKERRQ(ierr); 1852b68353e5Sstefano_zampini if (reuse == MAT_REUSE_MATRIX) { 1853b68353e5Sstefano_zampini PetscInt rnr; 1854b68353e5Sstefano_zampini 1855b68353e5Sstefano_zampini ierr = MatGetRowIJ(*newmat,0,PETSC_FALSE,PETSC_FALSE,&rnr,(const PetscInt**)&ii,(const PetscInt**)&jj,&done);CHKERRQ(ierr); 1856*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(!done,PetscObjectComm((PetscObject)A),PETSC_ERR_PLIB,"MatGetRowIJ"); 1857*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(rnr != nr,PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of rows"); 1858b68353e5Sstefano_zampini ierr = MatSeqAIJGetArray(*newmat,&vv);CHKERRQ(ierr); 1859b68353e5Sstefano_zampini } 1860b68353e5Sstefano_zampini /* extract CSR for nested SeqAIJ matrices */ 1861b68353e5Sstefano_zampini nnz = 0; 186223875855Sstefano_zampini ierr = PetscCalloc4(nest->nr*nest->nc,&aii,nest->nr*nest->nc,&ajj,nest->nr*nest->nc,&avv,nest->nr*nest->nc,&trans);CHKERRQ(ierr); 1863b68353e5Sstefano_zampini for (i=0; i<nest->nr; ++i) { 1864b68353e5Sstefano_zampini for (j=0; j<nest->nc; ++j) { 1865b68353e5Sstefano_zampini Mat B = nest->m[i][j]; 1866b68353e5Sstefano_zampini if (B) { 1867b68353e5Sstefano_zampini PetscScalar *naa; 1868b68353e5Sstefano_zampini PetscInt *nii,*njj,nnr; 186923875855Sstefano_zampini PetscBool istrans; 1870b68353e5Sstefano_zampini 187123875855Sstefano_zampini ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans);CHKERRQ(ierr); 187223875855Sstefano_zampini if (istrans) { 187323875855Sstefano_zampini Mat Bt; 187423875855Sstefano_zampini 187523875855Sstefano_zampini ierr = MatTransposeGetMat(B,&Bt);CHKERRQ(ierr); 187623875855Sstefano_zampini ierr = MatTranspose(Bt,MAT_INITIAL_MATRIX,&trans[i*nest->nc+j]);CHKERRQ(ierr); 187723875855Sstefano_zampini B = trans[i*nest->nc+j]; 187823875855Sstefano_zampini } 1879b68353e5Sstefano_zampini ierr = MatGetRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&nii,(const PetscInt**)&njj,&done);CHKERRQ(ierr); 1880*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(!done,PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatGetRowIJ"); 1881b68353e5Sstefano_zampini ierr = MatSeqAIJGetArray(B,&naa);CHKERRQ(ierr); 1882b68353e5Sstefano_zampini nnz += nii[nnr]; 1883b68353e5Sstefano_zampini 1884b68353e5Sstefano_zampini aii[i*nest->nc+j] = nii; 1885b68353e5Sstefano_zampini ajj[i*nest->nc+j] = njj; 1886b68353e5Sstefano_zampini avv[i*nest->nc+j] = naa; 1887b68353e5Sstefano_zampini } 1888b68353e5Sstefano_zampini } 1889b68353e5Sstefano_zampini } 1890b68353e5Sstefano_zampini if (reuse != MAT_REUSE_MATRIX) { 1891b68353e5Sstefano_zampini ierr = PetscMalloc1(nr+1,&ii);CHKERRQ(ierr); 1892b68353e5Sstefano_zampini ierr = PetscMalloc1(nnz,&jj);CHKERRQ(ierr); 1893b68353e5Sstefano_zampini ierr = PetscMalloc1(nnz,&vv);CHKERRQ(ierr); 1894b68353e5Sstefano_zampini } else { 1895*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(nnz != ii[nr],PetscObjectComm((PetscObject)A),PETSC_ERR_USER,"Cannot reuse matrix, wrong number of nonzeros"); 1896b68353e5Sstefano_zampini } 1897b68353e5Sstefano_zampini 1898b68353e5Sstefano_zampini /* new row pointer */ 1899580bdb30SBarry Smith ierr = PetscArrayzero(ii,nr+1);CHKERRQ(ierr); 1900b68353e5Sstefano_zampini for (i=0; i<nest->nr; ++i) { 1901b68353e5Sstefano_zampini PetscInt ncr,rst; 1902b68353e5Sstefano_zampini 1903b68353e5Sstefano_zampini ierr = ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL);CHKERRQ(ierr); 1904b68353e5Sstefano_zampini ierr = ISGetLocalSize(nest->isglobal.row[i],&ncr);CHKERRQ(ierr); 1905b68353e5Sstefano_zampini for (j=0; j<nest->nc; ++j) { 1906b68353e5Sstefano_zampini if (aii[i*nest->nc+j]) { 1907b68353e5Sstefano_zampini PetscInt *nii = aii[i*nest->nc+j]; 1908b68353e5Sstefano_zampini PetscInt ir; 1909b68353e5Sstefano_zampini 1910b68353e5Sstefano_zampini for (ir=rst; ir<ncr+rst; ++ir) { 1911b68353e5Sstefano_zampini ii[ir+1] += nii[1]-nii[0]; 1912b68353e5Sstefano_zampini nii++; 1913b68353e5Sstefano_zampini } 1914b68353e5Sstefano_zampini } 1915b68353e5Sstefano_zampini } 1916b68353e5Sstefano_zampini } 1917b68353e5Sstefano_zampini for (i=0; i<nr; i++) ii[i+1] += ii[i]; 1918b68353e5Sstefano_zampini 1919b68353e5Sstefano_zampini /* construct CSR for the new matrix */ 1920b68353e5Sstefano_zampini ierr = PetscCalloc1(nr,&ci);CHKERRQ(ierr); 1921b68353e5Sstefano_zampini for (i=0; i<nest->nr; ++i) { 1922b68353e5Sstefano_zampini PetscInt ncr,rst; 1923b68353e5Sstefano_zampini 1924b68353e5Sstefano_zampini ierr = ISStrideGetInfo(nest->isglobal.row[i],&rst,NULL);CHKERRQ(ierr); 1925b68353e5Sstefano_zampini ierr = ISGetLocalSize(nest->isglobal.row[i],&ncr);CHKERRQ(ierr); 1926b68353e5Sstefano_zampini for (j=0; j<nest->nc; ++j) { 1927b68353e5Sstefano_zampini if (aii[i*nest->nc+j]) { 1928b68353e5Sstefano_zampini PetscScalar *nvv = avv[i*nest->nc+j]; 1929b68353e5Sstefano_zampini PetscInt *nii = aii[i*nest->nc+j]; 1930b68353e5Sstefano_zampini PetscInt *njj = ajj[i*nest->nc+j]; 1931b68353e5Sstefano_zampini PetscInt ir,cst; 1932b68353e5Sstefano_zampini 1933b68353e5Sstefano_zampini ierr = ISStrideGetInfo(nest->isglobal.col[j],&cst,NULL);CHKERRQ(ierr); 1934b68353e5Sstefano_zampini for (ir=rst; ir<ncr+rst; ++ir) { 1935b68353e5Sstefano_zampini PetscInt ij,rsize = nii[1]-nii[0],ist = ii[ir]+ci[ir]; 1936b68353e5Sstefano_zampini 1937b68353e5Sstefano_zampini for (ij=0;ij<rsize;ij++) { 1938b68353e5Sstefano_zampini jj[ist+ij] = *njj+cst; 1939b68353e5Sstefano_zampini vv[ist+ij] = *nvv; 1940b68353e5Sstefano_zampini njj++; 1941b68353e5Sstefano_zampini nvv++; 1942b68353e5Sstefano_zampini } 1943b68353e5Sstefano_zampini ci[ir] += rsize; 1944b68353e5Sstefano_zampini nii++; 1945b68353e5Sstefano_zampini } 1946b68353e5Sstefano_zampini } 1947b68353e5Sstefano_zampini } 1948b68353e5Sstefano_zampini } 1949b68353e5Sstefano_zampini ierr = PetscFree(ci);CHKERRQ(ierr); 1950b68353e5Sstefano_zampini 1951b68353e5Sstefano_zampini /* restore info */ 1952b68353e5Sstefano_zampini for (i=0; i<nest->nr; ++i) { 1953b68353e5Sstefano_zampini for (j=0; j<nest->nc; ++j) { 1954b68353e5Sstefano_zampini Mat B = nest->m[i][j]; 1955b68353e5Sstefano_zampini if (B) { 1956b68353e5Sstefano_zampini PetscInt nnr = 0, k = i*nest->nc+j; 195723875855Sstefano_zampini 195823875855Sstefano_zampini B = (trans[k] ? trans[k] : B); 1959b68353e5Sstefano_zampini ierr = MatRestoreRowIJ(B,0,PETSC_FALSE,PETSC_FALSE,&nnr,(const PetscInt**)&aii[k],(const PetscInt**)&ajj[k],&done);CHKERRQ(ierr); 1960*2c71b3e2SJacob Faibussowitsch PetscCheckFalse(!done,PetscObjectComm((PetscObject)B),PETSC_ERR_PLIB,"MatRestoreRowIJ"); 1961b68353e5Sstefano_zampini ierr = MatSeqAIJRestoreArray(B,&avv[k]);CHKERRQ(ierr); 196223875855Sstefano_zampini ierr = MatDestroy(&trans[k]);CHKERRQ(ierr); 1963b68353e5Sstefano_zampini } 1964b68353e5Sstefano_zampini } 1965b68353e5Sstefano_zampini } 196623875855Sstefano_zampini ierr = PetscFree4(aii,ajj,avv,trans);CHKERRQ(ierr); 1967b68353e5Sstefano_zampini 1968b68353e5Sstefano_zampini /* finalize newmat */ 1969b68353e5Sstefano_zampini if (reuse == MAT_INITIAL_MATRIX) { 1970b68353e5Sstefano_zampini ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,newmat);CHKERRQ(ierr); 1971b68353e5Sstefano_zampini } else if (reuse == MAT_INPLACE_MATRIX) { 1972b68353e5Sstefano_zampini Mat B; 1973b68353e5Sstefano_zampini 1974b68353e5Sstefano_zampini ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),nr,nc,ii,jj,vv,&B);CHKERRQ(ierr); 1975b68353e5Sstefano_zampini ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr); 1976b68353e5Sstefano_zampini } 1977b68353e5Sstefano_zampini ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1978b68353e5Sstefano_zampini ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1979b68353e5Sstefano_zampini { 1980b68353e5Sstefano_zampini Mat_SeqAIJ *a = (Mat_SeqAIJ*)((*newmat)->data); 1981b68353e5Sstefano_zampini a->free_a = PETSC_TRUE; 1982b68353e5Sstefano_zampini a->free_ij = PETSC_TRUE; 1983b68353e5Sstefano_zampini } 1984b68353e5Sstefano_zampini PetscFunctionReturn(0); 1985b68353e5Sstefano_zampini } 1986b68353e5Sstefano_zampini 1987be705e3aSPierre Jolivet PETSC_INTERN PetscErrorCode MatAXPY_Dense_Nest(Mat Y,PetscScalar a,Mat X) 1988be705e3aSPierre Jolivet { 1989be705e3aSPierre Jolivet Mat_Nest *nest = (Mat_Nest*)X->data; 1990be705e3aSPierre Jolivet PetscInt i,j,k,rstart; 1991be705e3aSPierre Jolivet PetscBool flg; 1992be705e3aSPierre Jolivet PetscErrorCode ierr; 1993be705e3aSPierre Jolivet 1994be705e3aSPierre Jolivet PetscFunctionBegin; 1995be705e3aSPierre Jolivet /* Fill by row */ 1996be705e3aSPierre Jolivet for (j=0; j<nest->nc; ++j) { 1997be705e3aSPierre Jolivet /* Using global column indices and ISAllGather() is not scalable. */ 1998be705e3aSPierre Jolivet IS bNis; 1999be705e3aSPierre Jolivet PetscInt bN; 2000be705e3aSPierre Jolivet const PetscInt *bNindices; 2001be705e3aSPierre Jolivet ierr = ISAllGather(nest->isglobal.col[j], &bNis);CHKERRQ(ierr); 2002be705e3aSPierre Jolivet ierr = ISGetSize(bNis,&bN);CHKERRQ(ierr); 2003be705e3aSPierre Jolivet ierr = ISGetIndices(bNis,&bNindices);CHKERRQ(ierr); 2004be705e3aSPierre Jolivet for (i=0; i<nest->nr; ++i) { 2005be705e3aSPierre Jolivet Mat B,D=NULL; 2006be705e3aSPierre Jolivet PetscInt bm, br; 2007be705e3aSPierre Jolivet const PetscInt *bmindices; 2008be705e3aSPierre Jolivet B = nest->m[i][j]; 2009be705e3aSPierre Jolivet if (!B) continue; 2010be705e3aSPierre Jolivet ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&flg);CHKERRQ(ierr); 2011be705e3aSPierre Jolivet if (flg) { 2012be705e3aSPierre Jolivet ierr = PetscTryMethod(B,"MatTransposeGetMat_C",(Mat,Mat*),(B,&D));CHKERRQ(ierr); 2013be705e3aSPierre Jolivet ierr = PetscTryMethod(B,"MatHermitianTransposeGetMat_C",(Mat,Mat*),(B,&D));CHKERRQ(ierr); 2014be705e3aSPierre Jolivet ierr = MatConvert(B,((PetscObject)D)->type_name,MAT_INITIAL_MATRIX,&D);CHKERRQ(ierr); 2015be705e3aSPierre Jolivet B = D; 2016be705e3aSPierre Jolivet } 2017be705e3aSPierre Jolivet ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQSBAIJ,MATMPISBAIJ,"");CHKERRQ(ierr); 2018be705e3aSPierre Jolivet if (flg) { 2019be705e3aSPierre Jolivet if (D) { 2020be705e3aSPierre Jolivet ierr = MatConvert(D,MATBAIJ,MAT_INPLACE_MATRIX,&D);CHKERRQ(ierr); 2021be705e3aSPierre Jolivet } else { 2022be705e3aSPierre Jolivet ierr = MatConvert(B,MATBAIJ,MAT_INITIAL_MATRIX,&D);CHKERRQ(ierr); 2023be705e3aSPierre Jolivet } 2024be705e3aSPierre Jolivet B = D; 2025be705e3aSPierre Jolivet } 2026be705e3aSPierre Jolivet ierr = ISGetLocalSize(nest->isglobal.row[i],&bm);CHKERRQ(ierr); 2027be705e3aSPierre Jolivet ierr = ISGetIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr); 2028be705e3aSPierre Jolivet ierr = MatGetOwnershipRange(B,&rstart,NULL);CHKERRQ(ierr); 2029be705e3aSPierre Jolivet for (br = 0; br < bm; ++br) { 2030be705e3aSPierre Jolivet PetscInt row = bmindices[br], brncols, *cols; 2031be705e3aSPierre Jolivet const PetscInt *brcols; 2032be705e3aSPierre Jolivet const PetscScalar *brcoldata; 2033be705e3aSPierre Jolivet PetscScalar *vals = NULL; 2034be705e3aSPierre Jolivet ierr = MatGetRow(B,br+rstart,&brncols,&brcols,&brcoldata);CHKERRQ(ierr); 2035be705e3aSPierre Jolivet ierr = PetscMalloc1(brncols,&cols);CHKERRQ(ierr); 2036be705e3aSPierre Jolivet for (k=0; k<brncols; k++) cols[k] = bNindices[brcols[k]]; 2037be705e3aSPierre Jolivet /* 2038be705e3aSPierre Jolivet Nest blocks are required to be nonoverlapping -- otherwise nest and monolithic index layouts wouldn't match. 2039be705e3aSPierre Jolivet Thus, we could use INSERT_VALUES, but I prefer ADD_VALUES. 2040be705e3aSPierre Jolivet */ 2041be705e3aSPierre Jolivet if (a != 1.0) { 2042be705e3aSPierre Jolivet ierr = PetscMalloc1(brncols,&vals);CHKERRQ(ierr); 2043be705e3aSPierre Jolivet for (k=0; k<brncols; k++) vals[k] = a * brcoldata[k]; 2044be705e3aSPierre Jolivet ierr = MatSetValues(Y,1,&row,brncols,cols,vals,ADD_VALUES);CHKERRQ(ierr); 2045be705e3aSPierre Jolivet ierr = PetscFree(vals);CHKERRQ(ierr); 2046be705e3aSPierre Jolivet } else { 2047be705e3aSPierre Jolivet ierr = MatSetValues(Y,1,&row,brncols,cols,brcoldata,ADD_VALUES);CHKERRQ(ierr); 2048be705e3aSPierre Jolivet } 2049be705e3aSPierre Jolivet ierr = MatRestoreRow(B,br+rstart,&brncols,&brcols,&brcoldata);CHKERRQ(ierr); 2050be705e3aSPierre Jolivet ierr = PetscFree(cols);CHKERRQ(ierr); 2051be705e3aSPierre Jolivet } 2052be705e3aSPierre Jolivet if (D) { 20531e1ea65dSPierre Jolivet ierr = MatDestroy(&D);CHKERRQ(ierr); 2054be705e3aSPierre Jolivet } 2055be705e3aSPierre Jolivet ierr = ISRestoreIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr); 2056be705e3aSPierre Jolivet } 2057be705e3aSPierre Jolivet ierr = ISRestoreIndices(bNis,&bNindices);CHKERRQ(ierr); 2058be705e3aSPierre Jolivet ierr = ISDestroy(&bNis);CHKERRQ(ierr); 2059be705e3aSPierre Jolivet } 2060be705e3aSPierre Jolivet ierr = MatAssemblyBegin(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2061be705e3aSPierre Jolivet ierr = MatAssemblyEnd(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2062be705e3aSPierre Jolivet PetscFunctionReturn(0); 2063be705e3aSPierre Jolivet } 2064be705e3aSPierre Jolivet 2065be705e3aSPierre Jolivet PetscErrorCode MatConvert_Nest_AIJ(Mat A,MatType newtype,MatReuse reuse,Mat *newmat) 2066629c3df2SDmitry Karpeev { 2067629c3df2SDmitry Karpeev PetscErrorCode ierr; 2068629c3df2SDmitry Karpeev Mat_Nest *nest = (Mat_Nest*)A->data; 2069be705e3aSPierre Jolivet PetscInt m,n,M,N,i,j,k,*dnnz,*onnz,rstart,cstart,cend; 2070b68353e5Sstefano_zampini PetscMPIInt size; 2071629c3df2SDmitry Karpeev Mat C; 2072629c3df2SDmitry Karpeev 2073629c3df2SDmitry Karpeev PetscFunctionBegin; 2074ffc4695bSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&size);CHKERRMPI(ierr); 2075b68353e5Sstefano_zampini if (size == 1) { /* look for a special case with SeqAIJ matrices and strided-1, contiguous, blocks */ 2076b68353e5Sstefano_zampini PetscInt nf; 2077b68353e5Sstefano_zampini PetscBool fast; 2078b68353e5Sstefano_zampini 2079b68353e5Sstefano_zampini ierr = PetscStrcmp(newtype,MATAIJ,&fast);CHKERRQ(ierr); 2080b68353e5Sstefano_zampini if (!fast) { 2081b68353e5Sstefano_zampini ierr = PetscStrcmp(newtype,MATSEQAIJ,&fast);CHKERRQ(ierr); 2082b68353e5Sstefano_zampini } 2083b68353e5Sstefano_zampini for (i=0; i<nest->nr && fast; ++i) { 2084b68353e5Sstefano_zampini for (j=0; j<nest->nc && fast; ++j) { 2085b68353e5Sstefano_zampini Mat B = nest->m[i][j]; 2086b68353e5Sstefano_zampini if (B) { 2087b68353e5Sstefano_zampini ierr = PetscObjectTypeCompare((PetscObject)B,MATSEQAIJ,&fast);CHKERRQ(ierr); 208823875855Sstefano_zampini if (!fast) { 208923875855Sstefano_zampini PetscBool istrans; 209023875855Sstefano_zampini 209123875855Sstefano_zampini ierr = PetscObjectTypeCompare((PetscObject)B,MATTRANSPOSEMAT,&istrans);CHKERRQ(ierr); 209223875855Sstefano_zampini if (istrans) { 209323875855Sstefano_zampini Mat Bt; 209423875855Sstefano_zampini 209523875855Sstefano_zampini ierr = MatTransposeGetMat(B,&Bt);CHKERRQ(ierr); 209623875855Sstefano_zampini ierr = PetscObjectTypeCompare((PetscObject)Bt,MATSEQAIJ,&fast);CHKERRQ(ierr); 209723875855Sstefano_zampini } 2098b68353e5Sstefano_zampini } 2099b68353e5Sstefano_zampini } 2100b68353e5Sstefano_zampini } 2101b68353e5Sstefano_zampini } 2102b68353e5Sstefano_zampini for (i=0, nf=0; i<nest->nr && fast; ++i) { 2103b68353e5Sstefano_zampini ierr = PetscObjectTypeCompare((PetscObject)nest->isglobal.row[i],ISSTRIDE,&fast);CHKERRQ(ierr); 2104b68353e5Sstefano_zampini if (fast) { 2105b68353e5Sstefano_zampini PetscInt f,s; 2106b68353e5Sstefano_zampini 2107b68353e5Sstefano_zampini ierr = ISStrideGetInfo(nest->isglobal.row[i],&f,&s);CHKERRQ(ierr); 2108b68353e5Sstefano_zampini if (f != nf || s != 1) { fast = PETSC_FALSE; } 2109b68353e5Sstefano_zampini else { 2110b68353e5Sstefano_zampini ierr = ISGetSize(nest->isglobal.row[i],&f);CHKERRQ(ierr); 2111b68353e5Sstefano_zampini nf += f; 2112b68353e5Sstefano_zampini } 2113b68353e5Sstefano_zampini } 2114b68353e5Sstefano_zampini } 2115b68353e5Sstefano_zampini for (i=0, nf=0; i<nest->nc && fast; ++i) { 2116b68353e5Sstefano_zampini ierr = PetscObjectTypeCompare((PetscObject)nest->isglobal.col[i],ISSTRIDE,&fast);CHKERRQ(ierr); 2117b68353e5Sstefano_zampini if (fast) { 2118b68353e5Sstefano_zampini PetscInt f,s; 2119b68353e5Sstefano_zampini 2120b68353e5Sstefano_zampini ierr = ISStrideGetInfo(nest->isglobal.col[i],&f,&s);CHKERRQ(ierr); 2121b68353e5Sstefano_zampini if (f != nf || s != 1) { fast = PETSC_FALSE; } 2122b68353e5Sstefano_zampini else { 2123b68353e5Sstefano_zampini ierr = ISGetSize(nest->isglobal.col[i],&f);CHKERRQ(ierr); 2124b68353e5Sstefano_zampini nf += f; 2125b68353e5Sstefano_zampini } 2126b68353e5Sstefano_zampini } 2127b68353e5Sstefano_zampini } 2128b68353e5Sstefano_zampini if (fast) { 2129b68353e5Sstefano_zampini ierr = MatConvert_Nest_SeqAIJ_fast(A,newtype,reuse,newmat);CHKERRQ(ierr); 2130b68353e5Sstefano_zampini PetscFunctionReturn(0); 2131b68353e5Sstefano_zampini } 2132b68353e5Sstefano_zampini } 2133629c3df2SDmitry Karpeev ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr); 2134629c3df2SDmitry Karpeev ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr); 2135649b366bSFande Kong ierr = MatGetOwnershipRangeColumn(A,&cstart,&cend);CHKERRQ(ierr); 2136d1487292SPierre Jolivet if (reuse == MAT_REUSE_MATRIX) C = *newmat; 2137d1487292SPierre Jolivet else { 2138ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr); 2139629c3df2SDmitry Karpeev ierr = MatSetType(C,newtype);CHKERRQ(ierr); 2140629c3df2SDmitry Karpeev ierr = MatSetSizes(C,m,n,M,N);CHKERRQ(ierr); 2141629c3df2SDmitry Karpeev } 2142785e854fSJed Brown ierr = PetscMalloc1(2*m,&dnnz);CHKERRQ(ierr); 2143629c3df2SDmitry Karpeev onnz = dnnz + m; 2144629c3df2SDmitry Karpeev for (k=0; k<m; k++) { 2145629c3df2SDmitry Karpeev dnnz[k] = 0; 2146629c3df2SDmitry Karpeev onnz[k] = 0; 2147629c3df2SDmitry Karpeev } 2148629c3df2SDmitry Karpeev for (j=0; j<nest->nc; ++j) { 2149629c3df2SDmitry Karpeev IS bNis; 2150629c3df2SDmitry Karpeev PetscInt bN; 2151629c3df2SDmitry Karpeev const PetscInt *bNindices; 2152629c3df2SDmitry Karpeev /* Using global column indices and ISAllGather() is not scalable. */ 2153629c3df2SDmitry Karpeev ierr = ISAllGather(nest->isglobal.col[j], &bNis);CHKERRQ(ierr); 2154629c3df2SDmitry Karpeev ierr = ISGetSize(bNis, &bN);CHKERRQ(ierr); 2155629c3df2SDmitry Karpeev ierr = ISGetIndices(bNis,&bNindices);CHKERRQ(ierr); 2156629c3df2SDmitry Karpeev for (i=0; i<nest->nr; ++i) { 2157629c3df2SDmitry Karpeev PetscSF bmsf; 2158649b366bSFande Kong PetscSFNode *iremote; 2159629c3df2SDmitry Karpeev Mat B; 2160649b366bSFande Kong PetscInt bm, *sub_dnnz,*sub_onnz, br; 2161629c3df2SDmitry Karpeev const PetscInt *bmindices; 2162629c3df2SDmitry Karpeev B = nest->m[i][j]; 2163629c3df2SDmitry Karpeev if (!B) continue; 2164629c3df2SDmitry Karpeev ierr = ISGetLocalSize(nest->isglobal.row[i],&bm);CHKERRQ(ierr); 2165629c3df2SDmitry Karpeev ierr = ISGetIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr); 2166ce94432eSBarry Smith ierr = PetscSFCreate(PetscObjectComm((PetscObject)A), &bmsf);CHKERRQ(ierr); 2167649b366bSFande Kong ierr = PetscMalloc1(bm,&iremote);CHKERRQ(ierr); 2168649b366bSFande Kong ierr = PetscMalloc1(bm,&sub_dnnz);CHKERRQ(ierr); 2169649b366bSFande Kong ierr = PetscMalloc1(bm,&sub_onnz);CHKERRQ(ierr); 2170649b366bSFande Kong for (k = 0; k < bm; ++k) { 2171649b366bSFande Kong sub_dnnz[k] = 0; 2172649b366bSFande Kong sub_onnz[k] = 0; 2173649b366bSFande Kong } 2174629c3df2SDmitry Karpeev /* 2175629c3df2SDmitry Karpeev Locate the owners for all of the locally-owned global row indices for this row block. 2176629c3df2SDmitry Karpeev These determine the roots of PetscSF used to communicate preallocation data to row owners. 2177629c3df2SDmitry Karpeev The roots correspond to the dnnz and onnz entries; thus, there are two roots per row. 2178629c3df2SDmitry Karpeev */ 217983b1a929SMark Adams ierr = MatGetOwnershipRange(B,&rstart,NULL);CHKERRQ(ierr); 2180629c3df2SDmitry Karpeev for (br = 0; br < bm; ++br) { 2181131c27b5Sprj- PetscInt row = bmindices[br], brncols, col; 2182629c3df2SDmitry Karpeev const PetscInt *brcols; 2183a4b3d3acSMatthew G Knepley PetscInt rowrel = 0; /* row's relative index on its owner rank */ 2184131c27b5Sprj- PetscMPIInt rowowner = 0; 2185629c3df2SDmitry Karpeev ierr = PetscLayoutFindOwnerIndex(A->rmap,row,&rowowner,&rowrel);CHKERRQ(ierr); 2186649b366bSFande Kong /* how many roots */ 2187649b366bSFande Kong iremote[br].rank = rowowner; iremote[br].index = rowrel; /* edge from bmdnnz to dnnz */ 2188649b366bSFande Kong /* get nonzero pattern */ 218983b1a929SMark Adams ierr = MatGetRow(B,br+rstart,&brncols,&brcols,NULL);CHKERRQ(ierr); 2190629c3df2SDmitry Karpeev for (k=0; k<brncols; k++) { 2191629c3df2SDmitry Karpeev col = bNindices[brcols[k]]; 2192649b366bSFande Kong if (col>=A->cmap->range[rowowner] && col<A->cmap->range[rowowner+1]) { 2193649b366bSFande Kong sub_dnnz[br]++; 2194649b366bSFande Kong } else { 2195649b366bSFande Kong sub_onnz[br]++; 2196649b366bSFande Kong } 2197629c3df2SDmitry Karpeev } 219883b1a929SMark Adams ierr = MatRestoreRow(B,br+rstart,&brncols,&brcols,NULL);CHKERRQ(ierr); 2199629c3df2SDmitry Karpeev } 2200629c3df2SDmitry Karpeev ierr = ISRestoreIndices(nest->isglobal.row[i],&bmindices);CHKERRQ(ierr); 2201629c3df2SDmitry Karpeev /* bsf will have to take care of disposing of bedges. */ 2202649b366bSFande Kong ierr = PetscSFSetGraph(bmsf,m,bm,NULL,PETSC_OWN_POINTER,iremote,PETSC_OWN_POINTER);CHKERRQ(ierr); 2203649b366bSFande Kong ierr = PetscSFReduceBegin(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM);CHKERRQ(ierr); 2204649b366bSFande Kong ierr = PetscSFReduceEnd(bmsf,MPIU_INT,sub_dnnz,dnnz,MPI_SUM);CHKERRQ(ierr); 2205649b366bSFande Kong ierr = PetscSFReduceBegin(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM);CHKERRQ(ierr); 2206649b366bSFande Kong ierr = PetscSFReduceEnd(bmsf,MPIU_INT,sub_onnz,onnz,MPI_SUM);CHKERRQ(ierr); 2207649b366bSFande Kong ierr = PetscFree(sub_dnnz);CHKERRQ(ierr); 2208649b366bSFande Kong ierr = PetscFree(sub_onnz);CHKERRQ(ierr); 2209629c3df2SDmitry Karpeev ierr = PetscSFDestroy(&bmsf);CHKERRQ(ierr); 2210629c3df2SDmitry Karpeev } 221122d28d08SBarry Smith ierr = ISRestoreIndices(bNis,&bNindices);CHKERRQ(ierr); 2212629c3df2SDmitry Karpeev ierr = ISDestroy(&bNis);CHKERRQ(ierr); 221365a4a0a3Sstefano_zampini } 221465a4a0a3Sstefano_zampini /* Resize preallocation if overestimated */ 221565a4a0a3Sstefano_zampini for (i=0;i<m;i++) { 221665a4a0a3Sstefano_zampini dnnz[i] = PetscMin(dnnz[i],A->cmap->n); 221765a4a0a3Sstefano_zampini onnz[i] = PetscMin(onnz[i],A->cmap->N - A->cmap->n); 2218629c3df2SDmitry Karpeev } 2219629c3df2SDmitry Karpeev ierr = MatSeqAIJSetPreallocation(C,0,dnnz);CHKERRQ(ierr); 2220629c3df2SDmitry Karpeev ierr = MatMPIAIJSetPreallocation(C,0,dnnz,0,onnz);CHKERRQ(ierr); 2221629c3df2SDmitry Karpeev ierr = PetscFree(dnnz);CHKERRQ(ierr); 2222be705e3aSPierre Jolivet ierr = MatAXPY_Dense_Nest(C,1.0,A);CHKERRQ(ierr); 2223d1487292SPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) { 2224d1487292SPierre Jolivet ierr = MatHeaderReplace(A,&C);CHKERRQ(ierr); 2225d1487292SPierre Jolivet } else *newmat = C; 2226be705e3aSPierre Jolivet PetscFunctionReturn(0); 2227be705e3aSPierre Jolivet } 2228629c3df2SDmitry Karpeev 2229be705e3aSPierre Jolivet PetscErrorCode MatConvert_Nest_Dense(Mat A,MatType newtype,MatReuse reuse,Mat *newmat) 2230be705e3aSPierre Jolivet { 2231629c3df2SDmitry Karpeev Mat B; 2232be705e3aSPierre Jolivet PetscInt m,n,M,N; 2233be705e3aSPierre Jolivet PetscErrorCode ierr; 2234be705e3aSPierre Jolivet 2235be705e3aSPierre Jolivet PetscFunctionBegin; 2236be705e3aSPierre Jolivet ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr); 2237be705e3aSPierre Jolivet ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr); 2238be705e3aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 2239be705e3aSPierre Jolivet B = *newmat; 2240be705e3aSPierre Jolivet ierr = MatZeroEntries(B);CHKERRQ(ierr); 2241be705e3aSPierre Jolivet } else { 2242be705e3aSPierre Jolivet ierr = MatCreateDense(PetscObjectComm((PetscObject)A),m,PETSC_DECIDE,M,N,NULL,&B);CHKERRQ(ierr); 2243629c3df2SDmitry Karpeev } 2244be705e3aSPierre Jolivet ierr = MatAXPY_Dense_Nest(B,1.0,A);CHKERRQ(ierr); 2245be705e3aSPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) { 2246be705e3aSPierre Jolivet ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr); 2247be705e3aSPierre Jolivet } else if (reuse == MAT_INITIAL_MATRIX) *newmat = B; 2248629c3df2SDmitry Karpeev PetscFunctionReturn(0); 2249629c3df2SDmitry Karpeev } 2250629c3df2SDmitry Karpeev 22518b7d3b4bSBarry Smith PetscErrorCode MatHasOperation_Nest(Mat mat,MatOperation op,PetscBool *has) 22528b7d3b4bSBarry Smith { 22538b7d3b4bSBarry Smith Mat_Nest *bA = (Mat_Nest*)mat->data; 22543c6db4c4SPierre Jolivet MatOperation opAdd; 22558b7d3b4bSBarry Smith PetscInt i,j,nr = bA->nr,nc = bA->nc; 22568b7d3b4bSBarry Smith PetscBool flg; 225752c5f739Sprj- PetscErrorCode ierr; 225852c5f739Sprj- PetscFunctionBegin; 22598b7d3b4bSBarry Smith 226052c5f739Sprj- *has = PETSC_FALSE; 22613c6db4c4SPierre Jolivet if (op == MATOP_MULT || op == MATOP_MULT_ADD || op == MATOP_MULT_TRANSPOSE || op == MATOP_MULT_TRANSPOSE_ADD) { 22623c6db4c4SPierre Jolivet opAdd = (op == MATOP_MULT || op == MATOP_MULT_ADD ? MATOP_MULT_ADD : MATOP_MULT_TRANSPOSE_ADD); 22638b7d3b4bSBarry Smith for (j=0; j<nc; j++) { 22648b7d3b4bSBarry Smith for (i=0; i<nr; i++) { 22658b7d3b4bSBarry Smith if (!bA->m[i][j]) continue; 22663c6db4c4SPierre Jolivet ierr = MatHasOperation(bA->m[i][j],opAdd,&flg);CHKERRQ(ierr); 22678b7d3b4bSBarry Smith if (!flg) PetscFunctionReturn(0); 22688b7d3b4bSBarry Smith } 22698b7d3b4bSBarry Smith } 22708b7d3b4bSBarry Smith } 22713c6db4c4SPierre Jolivet if (((void**)mat->ops)[op]) *has = PETSC_TRUE; 22728b7d3b4bSBarry Smith PetscFunctionReturn(0); 22738b7d3b4bSBarry Smith } 22748b7d3b4bSBarry Smith 2275659c6bb0SJed Brown /*MC 2276659c6bb0SJed Brown MATNEST - MATNEST = "nest" - Matrix type consisting of nested submatrices, each stored separately. 2277659c6bb0SJed Brown 2278659c6bb0SJed Brown Level: intermediate 2279659c6bb0SJed Brown 2280659c6bb0SJed Brown Notes: 2281659c6bb0SJed Brown This matrix type permits scalable use of PCFieldSplit and avoids the large memory costs of extracting submatrices. 2282659c6bb0SJed Brown It allows the use of symmetric and block formats for parts of multi-physics simulations. 2283950540a4SJed Brown It is usually used with DMComposite and DMCreateMatrix() 2284659c6bb0SJed Brown 22858b7d3b4bSBarry Smith Each of the submatrices lives on the same MPI communicator as the original nest matrix (though they can have zero 22868b7d3b4bSBarry Smith rows/columns on some processes.) Thus this is not meant for cases where the submatrices live on far fewer processes 22878b7d3b4bSBarry Smith than the nest matrix. 22888b7d3b4bSBarry Smith 228979798668SBarry Smith .seealso: MatCreate(), MatType, MatCreateNest(), MatNestSetSubMat(), MatNestGetSubMat(), 229079798668SBarry Smith VecCreateNest(), DMCreateMatrix(), DMCOMPOSITE, MatNestSetVecType(), MatNestGetLocalISs(), 229179798668SBarry Smith MatNestGetISs(), MatNestSetSubMats(), MatNestGetSubMats() 2292659c6bb0SJed Brown M*/ 22938cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_Nest(Mat A) 2294c8883902SJed Brown { 2295c8883902SJed Brown Mat_Nest *s; 2296c8883902SJed Brown PetscErrorCode ierr; 2297c8883902SJed Brown 2298c8883902SJed Brown PetscFunctionBegin; 2299b00a9115SJed Brown ierr = PetscNewLog(A,&s);CHKERRQ(ierr); 2300c8883902SJed Brown A->data = (void*)s; 2301e7c19651SJed Brown 2302e7c19651SJed Brown s->nr = -1; 2303e7c19651SJed Brown s->nc = -1; 23040298fd71SBarry Smith s->m = NULL; 2305e7c19651SJed Brown s->splitassembly = PETSC_FALSE; 2306c8883902SJed Brown 2307c8883902SJed Brown ierr = PetscMemzero(A->ops,sizeof(*A->ops));CHKERRQ(ierr); 230826fbe8dcSKarl Rupp 2309c8883902SJed Brown A->ops->mult = MatMult_Nest; 23109194d70fSJed Brown A->ops->multadd = MatMultAdd_Nest; 2311c8883902SJed Brown A->ops->multtranspose = MatMultTranspose_Nest; 23129194d70fSJed Brown A->ops->multtransposeadd = MatMultTransposeAdd_Nest; 2313f8170845SAlex Fikl A->ops->transpose = MatTranspose_Nest; 2314c8883902SJed Brown A->ops->assemblybegin = MatAssemblyBegin_Nest; 2315c8883902SJed Brown A->ops->assemblyend = MatAssemblyEnd_Nest; 2316c8883902SJed Brown A->ops->zeroentries = MatZeroEntries_Nest; 2317c222c20dSDavid Ham A->ops->copy = MatCopy_Nest; 23186e76ffeaSPierre Jolivet A->ops->axpy = MatAXPY_Nest; 2319c8883902SJed Brown A->ops->duplicate = MatDuplicate_Nest; 23207dae84e0SHong Zhang A->ops->createsubmatrix = MatCreateSubMatrix_Nest; 2321c8883902SJed Brown A->ops->destroy = MatDestroy_Nest; 2322c8883902SJed Brown A->ops->view = MatView_Nest; 2323f4259b30SLisandro Dalcin A->ops->getvecs = NULL; /* Use VECNEST by calling MatNestSetVecType(A,VECNEST) */ 2324c8883902SJed Brown A->ops->getlocalsubmatrix = MatGetLocalSubMatrix_Nest; 2325c8883902SJed Brown A->ops->restorelocalsubmatrix = MatRestoreLocalSubMatrix_Nest; 2326429bac76SJed Brown A->ops->getdiagonal = MatGetDiagonal_Nest; 2327429bac76SJed Brown A->ops->diagonalscale = MatDiagonalScale_Nest; 2328a061e289SJed Brown A->ops->scale = MatScale_Nest; 2329a061e289SJed Brown A->ops->shift = MatShift_Nest; 233013135bc6SAlex Fikl A->ops->diagonalset = MatDiagonalSet_Nest; 2331f8170845SAlex Fikl A->ops->setrandom = MatSetRandom_Nest; 23328b7d3b4bSBarry Smith A->ops->hasoperation = MatHasOperation_Nest; 2333381b8e50SStefano Zampini A->ops->missingdiagonal = MatMissingDiagonal_Nest; 2334c8883902SJed Brown 2335f4259b30SLisandro Dalcin A->spptr = NULL; 2336c8883902SJed Brown A->assembled = PETSC_FALSE; 2337c8883902SJed Brown 2338c8883902SJed Brown /* expose Nest api's */ 2339bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMat_C", MatNestGetSubMat_Nest);CHKERRQ(ierr); 2340bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMat_C", MatNestSetSubMat_Nest);CHKERRQ(ierr); 2341bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSubMats_C", MatNestGetSubMats_Nest);CHKERRQ(ierr); 2342bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetSize_C", MatNestGetSize_Nest);CHKERRQ(ierr); 2343bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetISs_C", MatNestGetISs_Nest);CHKERRQ(ierr); 2344bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestGetLocalISs_C", MatNestGetLocalISs_Nest);CHKERRQ(ierr); 2345bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetVecType_C", MatNestSetVecType_Nest);CHKERRQ(ierr); 2346bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatNestSetSubMats_C", MatNestSetSubMats_Nest);CHKERRQ(ierr); 23470899c546SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpiaij_C", MatConvert_Nest_AIJ);CHKERRQ(ierr); 23480899c546SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqaij_C", MatConvert_Nest_AIJ);CHKERRQ(ierr); 234983b1a929SMark Adams ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_aij_C", MatConvert_Nest_AIJ);CHKERRQ(ierr); 23505e3038f0Sstefano_zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_is_C", MatConvert_Nest_IS);CHKERRQ(ierr); 2351be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_mpidense_C",MatConvert_Nest_Dense);CHKERRQ(ierr); 2352be705e3aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_nest_seqdense_C",MatConvert_Nest_Dense);CHKERRQ(ierr); 23534222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_seqdense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr); 23544222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_mpidense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr); 23554222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_nest_dense_C",MatProductSetFromOptions_Nest_Dense);CHKERRQ(ierr); 2356c8883902SJed Brown 2357c8883902SJed Brown ierr = PetscObjectChangeTypeName((PetscObject)A,MATNEST);CHKERRQ(ierr); 2358c8883902SJed Brown PetscFunctionReturn(0); 2359c8883902SJed Brown } 2360