1aaa7dc30SBarry Smith #include <../src/mat/impls/nest/matnestimpl.h> /*I "petscmat.h" I*/ 2b68353e5Sstefano_zampini #include <../src/mat/impls/aij/seq/aij.h> 30c312b8eSJed Brown #include <petscsf.h> 4d8588912SDave May 5c8883902SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat, PetscInt, const IS[], PetscInt, const IS[]); 606a1af2fSStefano Zampini static PetscErrorCode MatCreateVecs_Nest(Mat, Vec *, Vec *); 706a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat); 806a1af2fSStefano Zampini 95e3038f0Sstefano_zampini PETSC_INTERN PetscErrorCode MatConvert_Nest_IS(Mat, MatType, MatReuse, Mat *); 10c8883902SJed Brown 11d8588912SDave May /* private functions */ 12d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestGetSizes_Private(Mat A, PetscInt *m, PetscInt *n, PetscInt *M, PetscInt *N) 13d71ae5a4SJacob Faibussowitsch { 14d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 158188e55aSJed Brown PetscInt i, j; 16d8588912SDave May 17d8588912SDave May PetscFunctionBegin; 188188e55aSJed Brown *m = *n = *M = *N = 0; 198188e55aSJed Brown for (i = 0; i < bA->nr; i++) { /* rows */ 208188e55aSJed Brown PetscInt sm, sM; 219566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(bA->isglobal.row[i], &sm)); 229566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.row[i], &sM)); 238188e55aSJed Brown *m += sm; 248188e55aSJed Brown *M += sM; 25d8588912SDave May } 268188e55aSJed Brown for (j = 0; j < bA->nc; j++) { /* cols */ 278188e55aSJed Brown PetscInt sn, sN; 289566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(bA->isglobal.col[j], &sn)); 299566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.col[j], &sN)); 308188e55aSJed Brown *n += sn; 318188e55aSJed Brown *N += sN; 32d8588912SDave May } 333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 34d8588912SDave May } 35d8588912SDave May 36d8588912SDave May /* operations */ 37d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMult_Nest(Mat A, Vec x, Vec y) 38d71ae5a4SJacob Faibussowitsch { 39d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 40207556f9SJed Brown Vec *bx = bA->right, *by = bA->left; 41207556f9SJed Brown PetscInt i, j, nr = bA->nr, nc = bA->nc; 42d8588912SDave May 43d8588912SDave May PetscFunctionBegin; 449566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecGetSubVector(y, bA->isglobal.row[i], &by[i])); 459566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecGetSubVector(x, bA->isglobal.col[i], &bx[i])); 46207556f9SJed Brown for (i = 0; i < nr; i++) { 479566063dSJacob Faibussowitsch PetscCall(VecZeroEntries(by[i])); 48207556f9SJed Brown for (j = 0; j < nc; j++) { 49207556f9SJed Brown if (!bA->m[i][j]) continue; 50d8588912SDave May /* y[i] <- y[i] + A[i][j] * x[j] */ 519566063dSJacob Faibussowitsch PetscCall(MatMultAdd(bA->m[i][j], bx[j], by[i], by[i])); 52d8588912SDave May } 53d8588912SDave May } 549566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecRestoreSubVector(y, bA->isglobal.row[i], &by[i])); 559566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecRestoreSubVector(x, bA->isglobal.col[i], &bx[i])); 563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 57d8588912SDave May } 58d8588912SDave May 59d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultAdd_Nest(Mat A, Vec x, Vec y, Vec z) 60d71ae5a4SJacob Faibussowitsch { 619194d70fSJed Brown Mat_Nest *bA = (Mat_Nest *)A->data; 629194d70fSJed Brown Vec *bx = bA->right, *bz = bA->left; 639194d70fSJed Brown PetscInt i, j, nr = bA->nr, nc = bA->nc; 649194d70fSJed Brown 659194d70fSJed Brown PetscFunctionBegin; 669566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecGetSubVector(z, bA->isglobal.row[i], &bz[i])); 679566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecGetSubVector(x, bA->isglobal.col[i], &bx[i])); 689194d70fSJed Brown for (i = 0; i < nr; i++) { 699194d70fSJed Brown if (y != z) { 709194d70fSJed Brown Vec by; 719566063dSJacob Faibussowitsch PetscCall(VecGetSubVector(y, bA->isglobal.row[i], &by)); 729566063dSJacob Faibussowitsch PetscCall(VecCopy(by, bz[i])); 739566063dSJacob Faibussowitsch PetscCall(VecRestoreSubVector(y, bA->isglobal.row[i], &by)); 749194d70fSJed Brown } 759194d70fSJed Brown for (j = 0; j < nc; j++) { 769194d70fSJed Brown if (!bA->m[i][j]) continue; 779194d70fSJed Brown /* y[i] <- y[i] + A[i][j] * x[j] */ 789566063dSJacob Faibussowitsch PetscCall(MatMultAdd(bA->m[i][j], bx[j], bz[i], bz[i])); 799194d70fSJed Brown } 809194d70fSJed Brown } 819566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecRestoreSubVector(z, bA->isglobal.row[i], &bz[i])); 829566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecRestoreSubVector(x, bA->isglobal.col[i], &bx[i])); 833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 849194d70fSJed Brown } 859194d70fSJed Brown 8652c5f739Sprj- typedef struct { 8752c5f739Sprj- Mat *workC; /* array of Mat with specific containers depending on the underlying MatMatMult implementation */ 8852c5f739Sprj- PetscScalar *tarray; /* buffer for storing all temporary products A[i][j] B[j] */ 8952c5f739Sprj- PetscInt *dm, *dn, k; /* displacements and number of submatrices */ 9052c5f739Sprj- } Nest_Dense; 9152c5f739Sprj- 92a678f235SPierre Jolivet static PetscErrorCode MatProductNumeric_Nest_Dense(Mat C) 93d71ae5a4SJacob Faibussowitsch { 946718818eSStefano Zampini Mat_Nest *bA; 9552c5f739Sprj- Nest_Dense *contents; 966718818eSStefano Zampini Mat viewB, viewC, productB, workC; 9752c5f739Sprj- const PetscScalar *barray; 9852c5f739Sprj- PetscScalar *carray; 996718818eSStefano Zampini PetscInt i, j, M, N, nr, nc, ldb, ldc; 1006718818eSStefano Zampini Mat A, B; 10152c5f739Sprj- 10252c5f739Sprj- PetscFunctionBegin; 1030d6f747bSJacob Faibussowitsch MatCheckProduct(C, 1); 1046718818eSStefano Zampini A = C->product->A; 1056718818eSStefano Zampini B = C->product->B; 1069566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, NULL, &N)); 1076718818eSStefano Zampini if (!N) { 1089566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 1099566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 1103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1116718818eSStefano Zampini } 1126718818eSStefano Zampini contents = (Nest_Dense *)C->product->data; 11328b400f6SJacob Faibussowitsch PetscCheck(contents, PetscObjectComm((PetscObject)C), PETSC_ERR_PLIB, "Product data empty"); 1146718818eSStefano Zampini bA = (Mat_Nest *)A->data; 1156718818eSStefano Zampini nr = bA->nr; 1166718818eSStefano Zampini nc = bA->nc; 1179566063dSJacob Faibussowitsch PetscCall(MatDenseGetLDA(B, &ldb)); 1189566063dSJacob Faibussowitsch PetscCall(MatDenseGetLDA(C, &ldc)); 1199566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(C)); 1209566063dSJacob Faibussowitsch PetscCall(MatDenseGetArrayRead(B, &barray)); 1219566063dSJacob Faibussowitsch PetscCall(MatDenseGetArray(C, &carray)); 12252c5f739Sprj- for (i = 0; i < nr; i++) { 1239566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.row[i], &M)); 1248e3a54c0SPierre Jolivet PetscCall(MatCreateDense(PetscObjectComm((PetscObject)A), contents->dm[i + 1] - contents->dm[i], PETSC_DECIDE, M, N, PetscSafePointerPlusOffset(carray, contents->dm[i]), &viewC)); 1259566063dSJacob Faibussowitsch PetscCall(MatDenseSetLDA(viewC, ldc)); 12652c5f739Sprj- for (j = 0; j < nc; j++) { 12752c5f739Sprj- if (!bA->m[i][j]) continue; 1289566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.col[j], &M)); 1298e3a54c0SPierre Jolivet PetscCall(MatCreateDense(PetscObjectComm((PetscObject)A), contents->dn[j + 1] - contents->dn[j], PETSC_DECIDE, M, N, PetscSafePointerPlusOffset((PetscScalar *)barray, contents->dn[j]), &viewB)); 1309566063dSJacob Faibussowitsch PetscCall(MatDenseSetLDA(viewB, ldb)); 1314222ddf1SHong Zhang 1324222ddf1SHong Zhang /* MatMatMultNumeric(bA->m[i][j],viewB,contents->workC[i*nc + j]); */ 1334222ddf1SHong Zhang workC = contents->workC[i * nc + j]; 1344222ddf1SHong Zhang productB = workC->product->B; 1354222ddf1SHong Zhang workC->product->B = viewB; /* use newly created dense matrix viewB */ 1369566063dSJacob Faibussowitsch PetscCall(MatProductNumeric(workC)); 1379566063dSJacob Faibussowitsch PetscCall(MatDestroy(&viewB)); 1384222ddf1SHong Zhang workC->product->B = productB; /* resume original B */ 1394222ddf1SHong Zhang 14052c5f739Sprj- /* C[i] <- workC + C[i] */ 1419566063dSJacob Faibussowitsch PetscCall(MatAXPY(viewC, 1.0, contents->workC[i * nc + j], SAME_NONZERO_PATTERN)); 14252c5f739Sprj- } 1439566063dSJacob Faibussowitsch PetscCall(MatDestroy(&viewC)); 14452c5f739Sprj- } 1459566063dSJacob Faibussowitsch PetscCall(MatDenseRestoreArray(C, &carray)); 1469566063dSJacob Faibussowitsch PetscCall(MatDenseRestoreArrayRead(B, &barray)); 1474222ddf1SHong Zhang 14867af85e8SPierre Jolivet PetscCall(MatSetOption(C, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE)); 1499566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 1509566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 1513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 15252c5f739Sprj- } 15352c5f739Sprj- 15466976f2fSJacob Faibussowitsch static PetscErrorCode MatNest_DenseDestroy(void *ctx) 155d71ae5a4SJacob Faibussowitsch { 15652c5f739Sprj- Nest_Dense *contents = (Nest_Dense *)ctx; 15752c5f739Sprj- PetscInt i; 15852c5f739Sprj- 15952c5f739Sprj- PetscFunctionBegin; 1609566063dSJacob Faibussowitsch PetscCall(PetscFree(contents->tarray)); 16148a46eb9SPierre Jolivet for (i = 0; i < contents->k; i++) PetscCall(MatDestroy(contents->workC + i)); 1629566063dSJacob Faibussowitsch PetscCall(PetscFree3(contents->dm, contents->dn, contents->workC)); 1639566063dSJacob Faibussowitsch PetscCall(PetscFree(contents)); 1643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 16552c5f739Sprj- } 16652c5f739Sprj- 167a678f235SPierre Jolivet static PetscErrorCode MatProductSymbolic_Nest_Dense(Mat C) 168d71ae5a4SJacob Faibussowitsch { 1696718818eSStefano Zampini Mat_Nest *bA; 1706718818eSStefano Zampini Mat viewB, workC; 17152c5f739Sprj- const PetscScalar *barray; 1726718818eSStefano Zampini PetscInt i, j, M, N, m, n, nr, nc, maxm = 0, ldb; 1734222ddf1SHong Zhang Nest_Dense *contents = NULL; 1746718818eSStefano Zampini PetscBool cisdense; 1756718818eSStefano Zampini Mat A, B; 1766718818eSStefano Zampini PetscReal fill; 17752c5f739Sprj- 17852c5f739Sprj- PetscFunctionBegin; 1790d6f747bSJacob Faibussowitsch MatCheckProduct(C, 1); 18028b400f6SJacob Faibussowitsch PetscCheck(!C->product->data, PetscObjectComm((PetscObject)C), PETSC_ERR_PLIB, "Product data not empty"); 1816718818eSStefano Zampini A = C->product->A; 1826718818eSStefano Zampini B = C->product->B; 1836718818eSStefano Zampini fill = C->product->fill; 1846718818eSStefano Zampini bA = (Mat_Nest *)A->data; 1856718818eSStefano Zampini nr = bA->nr; 1866718818eSStefano Zampini nc = bA->nc; 1879566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(C, &m, &n)); 1889566063dSJacob Faibussowitsch PetscCall(MatGetSize(C, &M, &N)); 1890572eedcSPierre Jolivet if (m == PETSC_DECIDE || n == PETSC_DECIDE || M == PETSC_DECIDE || N == PETSC_DECIDE) { 1909566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(B, NULL, &n)); 1919566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, NULL, &N)); 1929566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(A, &m, NULL)); 1939566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &M, NULL)); 1949566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, M, N)); 1950572eedcSPierre Jolivet } 1969566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATMPIDENSE, MATSEQDENSECUDA, MATMPIDENSECUDA, "")); 19748a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, ((PetscObject)B)->type_name)); 1989566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 1996718818eSStefano Zampini if (!N) { 2006718818eSStefano Zampini C->ops->productnumeric = MatProductNumeric_Nest_Dense; 2013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 20252c5f739Sprj- } 20352c5f739Sprj- 2049566063dSJacob Faibussowitsch PetscCall(PetscNew(&contents)); 2056718818eSStefano Zampini C->product->data = contents; 2066718818eSStefano Zampini C->product->destroy = MatNest_DenseDestroy; 2079566063dSJacob Faibussowitsch PetscCall(PetscCalloc3(nr + 1, &contents->dm, nc + 1, &contents->dn, nr * nc, &contents->workC)); 20852c5f739Sprj- contents->k = nr * nc; 20952c5f739Sprj- for (i = 0; i < nr; i++) { 2109566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(bA->isglobal.row[i], contents->dm + i + 1)); 21152c5f739Sprj- maxm = PetscMax(maxm, contents->dm[i + 1]); 21252c5f739Sprj- contents->dm[i + 1] += contents->dm[i]; 21352c5f739Sprj- } 21452c5f739Sprj- for (i = 0; i < nc; i++) { 2159566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(bA->isglobal.col[i], contents->dn + i + 1)); 21652c5f739Sprj- contents->dn[i + 1] += contents->dn[i]; 21752c5f739Sprj- } 2189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(maxm * N, &contents->tarray)); 2199566063dSJacob Faibussowitsch PetscCall(MatDenseGetLDA(B, &ldb)); 2209566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, NULL, &N)); 2219566063dSJacob Faibussowitsch PetscCall(MatDenseGetArrayRead(B, &barray)); 22252c5f739Sprj- /* loops are permuted compared to MatMatMultNumeric so that viewB is created only once per column of A */ 22352c5f739Sprj- for (j = 0; j < nc; j++) { 2249566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.col[j], &M)); 2258e3a54c0SPierre Jolivet PetscCall(MatCreateDense(PetscObjectComm((PetscObject)A), contents->dn[j + 1] - contents->dn[j], PETSC_DECIDE, M, N, PetscSafePointerPlusOffset((PetscScalar *)barray, contents->dn[j]), &viewB)); 2269566063dSJacob Faibussowitsch PetscCall(MatDenseSetLDA(viewB, ldb)); 22752c5f739Sprj- for (i = 0; i < nr; i++) { 22852c5f739Sprj- if (!bA->m[i][j]) continue; 22952c5f739Sprj- /* MatMatMultSymbolic may attach a specific container (depending on MatType of bA->m[i][j]) to workC[i][j] */ 2304222ddf1SHong Zhang 2319566063dSJacob Faibussowitsch PetscCall(MatProductCreate(bA->m[i][j], viewB, NULL, &contents->workC[i * nc + j])); 2324222ddf1SHong Zhang workC = contents->workC[i * nc + j]; 2339566063dSJacob Faibussowitsch PetscCall(MatProductSetType(workC, MATPRODUCT_AB)); 2349566063dSJacob Faibussowitsch PetscCall(MatProductSetAlgorithm(workC, "default")); 2359566063dSJacob Faibussowitsch PetscCall(MatProductSetFill(workC, fill)); 2369566063dSJacob Faibussowitsch PetscCall(MatProductSetFromOptions(workC)); 2379566063dSJacob Faibussowitsch PetscCall(MatProductSymbolic(workC)); 2384222ddf1SHong Zhang 2396718818eSStefano Zampini /* since tarray will be shared by all Mat */ 2409566063dSJacob Faibussowitsch PetscCall(MatSeqDenseSetPreallocation(workC, contents->tarray)); 2419566063dSJacob Faibussowitsch PetscCall(MatMPIDenseSetPreallocation(workC, contents->tarray)); 24252c5f739Sprj- } 2439566063dSJacob Faibussowitsch PetscCall(MatDestroy(&viewB)); 24452c5f739Sprj- } 2459566063dSJacob Faibussowitsch PetscCall(MatDenseRestoreArrayRead(B, &barray)); 24652c5f739Sprj- 2476718818eSStefano Zampini C->ops->productnumeric = MatProductNumeric_Nest_Dense; 2483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24952c5f739Sprj- } 25052c5f739Sprj- 251a678f235SPierre Jolivet static PetscErrorCode MatProductSetFromOptions_Nest_Dense(Mat C) 252d71ae5a4SJacob Faibussowitsch { 2534222ddf1SHong Zhang Mat_Product *product = C->product; 25452c5f739Sprj- 25552c5f739Sprj- PetscFunctionBegin; 256c57d7d18SPierre Jolivet if (product->type == MATPRODUCT_AB) C->ops->productsymbolic = MatProductSymbolic_Nest_Dense; 2573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 25852c5f739Sprj- } 25952c5f739Sprj- 2600998551bSBlanca Mellado Pinto static PetscErrorCode MatMultTransposeKernel_Nest(Mat A, Vec x, Vec y, PetscBool herm) 261d71ae5a4SJacob Faibussowitsch { 262d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 263207556f9SJed Brown Vec *bx = bA->left, *by = bA->right; 264207556f9SJed Brown PetscInt i, j, nr = bA->nr, nc = bA->nc; 265d8588912SDave May 266d8588912SDave May PetscFunctionBegin; 2679566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecGetSubVector(x, bA->isglobal.row[i], &bx[i])); 2689566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecGetSubVector(y, bA->isglobal.col[i], &by[i])); 269207556f9SJed Brown for (j = 0; j < nc; j++) { 2709566063dSJacob Faibussowitsch PetscCall(VecZeroEntries(by[j])); 271609e31cbSJed Brown for (i = 0; i < nr; i++) { 2726c75ac25SJed Brown if (!bA->m[i][j]) continue; 2730998551bSBlanca Mellado Pinto if (herm) PetscCall(MatMultHermitianTransposeAdd(bA->m[i][j], bx[i], by[j], by[j])); /* y[j] <- y[j] + (A[i][j])^H * x[i] */ 2740998551bSBlanca Mellado Pinto else PetscCall(MatMultTransposeAdd(bA->m[i][j], bx[i], by[j], by[j])); /* y[j] <- y[j] + (A[i][j])^T * x[i] */ 275d8588912SDave May } 276d8588912SDave May } 2779566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecRestoreSubVector(x, bA->isglobal.row[i], &bx[i])); 2789566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecRestoreSubVector(y, bA->isglobal.col[i], &by[i])); 2793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 280d8588912SDave May } 281d8588912SDave May 2820998551bSBlanca Mellado Pinto static PetscErrorCode MatMultTranspose_Nest(Mat A, Vec x, Vec y) 2830998551bSBlanca Mellado Pinto { 2840998551bSBlanca Mellado Pinto PetscFunctionBegin; 2850998551bSBlanca Mellado Pinto PetscCall(MatMultTransposeKernel_Nest(A, x, y, PETSC_FALSE)); 2860998551bSBlanca Mellado Pinto PetscFunctionReturn(PETSC_SUCCESS); 2870998551bSBlanca Mellado Pinto } 2880998551bSBlanca Mellado Pinto 2890998551bSBlanca Mellado Pinto static PetscErrorCode MatMultHermitianTranspose_Nest(Mat A, Vec x, Vec y) 2900998551bSBlanca Mellado Pinto { 2910998551bSBlanca Mellado Pinto PetscFunctionBegin; 2920998551bSBlanca Mellado Pinto PetscCall(MatMultTransposeKernel_Nest(A, x, y, PETSC_TRUE)); 2930998551bSBlanca Mellado Pinto PetscFunctionReturn(PETSC_SUCCESS); 2940998551bSBlanca Mellado Pinto } 2950998551bSBlanca Mellado Pinto 2960998551bSBlanca Mellado Pinto static PetscErrorCode MatMultTransposeAddKernel_Nest(Mat A, Vec x, Vec y, Vec z, PetscBool herm) 297d71ae5a4SJacob Faibussowitsch { 2989194d70fSJed Brown Mat_Nest *bA = (Mat_Nest *)A->data; 2999194d70fSJed Brown Vec *bx = bA->left, *bz = bA->right; 3009194d70fSJed Brown PetscInt i, j, nr = bA->nr, nc = bA->nc; 3019194d70fSJed Brown 3029194d70fSJed Brown PetscFunctionBegin; 3039566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecGetSubVector(x, bA->isglobal.row[i], &bx[i])); 3049566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecGetSubVector(z, bA->isglobal.col[i], &bz[i])); 3059194d70fSJed Brown for (j = 0; j < nc; j++) { 3069194d70fSJed Brown if (y != z) { 3079194d70fSJed Brown Vec by; 3089566063dSJacob Faibussowitsch PetscCall(VecGetSubVector(y, bA->isglobal.col[j], &by)); 3099566063dSJacob Faibussowitsch PetscCall(VecCopy(by, bz[j])); 3109566063dSJacob Faibussowitsch PetscCall(VecRestoreSubVector(y, bA->isglobal.col[j], &by)); 3119194d70fSJed Brown } 3129194d70fSJed Brown for (i = 0; i < nr; i++) { 3136c75ac25SJed Brown if (!bA->m[i][j]) continue; 3140998551bSBlanca Mellado Pinto if (herm) PetscCall(MatMultHermitianTransposeAdd(bA->m[i][j], bx[i], bz[j], bz[j])); /* z[j] <- y[j] + (A[i][j])^H * x[i] */ 3150998551bSBlanca Mellado Pinto else PetscCall(MatMultTransposeAdd(bA->m[i][j], bx[i], bz[j], bz[j])); /* z[j] <- y[j] + (A[i][j])^T * x[i] */ 3169194d70fSJed Brown } 3179194d70fSJed Brown } 3189566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecRestoreSubVector(x, bA->isglobal.row[i], &bx[i])); 3199566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecRestoreSubVector(z, bA->isglobal.col[i], &bz[i])); 3203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3219194d70fSJed Brown } 3229194d70fSJed Brown 3230998551bSBlanca Mellado Pinto static PetscErrorCode MatMultTransposeAdd_Nest(Mat A, Vec x, Vec y, Vec z) 3240998551bSBlanca Mellado Pinto { 3250998551bSBlanca Mellado Pinto PetscFunctionBegin; 3260998551bSBlanca Mellado Pinto PetscCall(MatMultTransposeAddKernel_Nest(A, x, y, z, PETSC_FALSE)); 3270998551bSBlanca Mellado Pinto PetscFunctionReturn(PETSC_SUCCESS); 3280998551bSBlanca Mellado Pinto } 3290998551bSBlanca Mellado Pinto 3300998551bSBlanca Mellado Pinto static PetscErrorCode MatMultHermitianTransposeAdd_Nest(Mat A, Vec x, Vec y, Vec z) 3310998551bSBlanca Mellado Pinto { 3320998551bSBlanca Mellado Pinto PetscFunctionBegin; 3330998551bSBlanca Mellado Pinto PetscCall(MatMultTransposeAddKernel_Nest(A, x, y, z, PETSC_TRUE)); 3340998551bSBlanca Mellado Pinto PetscFunctionReturn(PETSC_SUCCESS); 3350998551bSBlanca Mellado Pinto } 3360998551bSBlanca Mellado Pinto 337d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatTranspose_Nest(Mat A, MatReuse reuse, Mat *B) 338d71ae5a4SJacob Faibussowitsch { 339f8170845SAlex Fikl Mat_Nest *bA = (Mat_Nest *)A->data, *bC; 340f8170845SAlex Fikl Mat C; 341f8170845SAlex Fikl PetscInt i, j, nr = bA->nr, nc = bA->nc; 342f8170845SAlex Fikl 343f8170845SAlex Fikl PetscFunctionBegin; 3447fb60732SBarry Smith if (reuse == MAT_REUSE_MATRIX) PetscCall(MatTransposeCheckNonzeroState_Private(A, *B)); 345aed4548fSBarry Smith PetscCheck(reuse != MAT_INPLACE_MATRIX || nr == nc, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_SIZ, "Square nested matrix only for in-place"); 346f8170845SAlex Fikl 347cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_INPLACE_MATRIX) { 348f8170845SAlex Fikl Mat *subs; 349f8170845SAlex Fikl IS *is_row, *is_col; 350f8170845SAlex Fikl 3519566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nr * nc, &subs)); 3529566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nr, &is_row, nc, &is_col)); 3539566063dSJacob Faibussowitsch PetscCall(MatNestGetISs(A, is_row, is_col)); 354cf37664fSBarry Smith if (reuse == MAT_INPLACE_MATRIX) { 355ddeb9bd8SAlex Fikl for (i = 0; i < nr; i++) { 356ad540459SPierre Jolivet for (j = 0; j < nc; j++) subs[i + nr * j] = bA->m[i][j]; 357ddeb9bd8SAlex Fikl } 358ddeb9bd8SAlex Fikl } 359ddeb9bd8SAlex Fikl 3609566063dSJacob Faibussowitsch PetscCall(MatCreateNest(PetscObjectComm((PetscObject)A), nc, is_col, nr, is_row, subs, &C)); 3619566063dSJacob Faibussowitsch PetscCall(PetscFree(subs)); 3629566063dSJacob Faibussowitsch PetscCall(PetscFree2(is_row, is_col)); 363f8170845SAlex Fikl } else { 364f8170845SAlex Fikl C = *B; 365f8170845SAlex Fikl } 366f8170845SAlex Fikl 367f8170845SAlex Fikl bC = (Mat_Nest *)C->data; 368f8170845SAlex Fikl for (i = 0; i < nr; i++) { 369f8170845SAlex Fikl for (j = 0; j < nc; j++) { 370f8170845SAlex Fikl if (bA->m[i][j]) { 371f4f49eeaSPierre Jolivet PetscCall(MatTranspose(bA->m[i][j], reuse, &bC->m[j][i])); 372f8170845SAlex Fikl } else { 373f8170845SAlex Fikl bC->m[j][i] = NULL; 374f8170845SAlex Fikl } 375f8170845SAlex Fikl } 376f8170845SAlex Fikl } 377f8170845SAlex Fikl 378cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) { 379f8170845SAlex Fikl *B = C; 380f8170845SAlex Fikl } else { 3819566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(A, &C)); 382f8170845SAlex Fikl } 3833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 384f8170845SAlex Fikl } 385f8170845SAlex Fikl 386d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestDestroyISList(PetscInt n, IS **list) 387d71ae5a4SJacob Faibussowitsch { 388e2d7f03fSJed Brown IS *lst = *list; 389e2d7f03fSJed Brown PetscInt i; 390e2d7f03fSJed Brown 391e2d7f03fSJed Brown PetscFunctionBegin; 3923ba16761SJacob Faibussowitsch if (!lst) PetscFunctionReturn(PETSC_SUCCESS); 3939371c9d4SSatish Balay for (i = 0; i < n; i++) 3949371c9d4SSatish Balay if (lst[i]) PetscCall(ISDestroy(&lst[i])); 3959566063dSJacob Faibussowitsch PetscCall(PetscFree(lst)); 3960298fd71SBarry Smith *list = NULL; 3973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 398e2d7f03fSJed Brown } 399e2d7f03fSJed Brown 400d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatReset_Nest(Mat A) 401d71ae5a4SJacob Faibussowitsch { 402d8588912SDave May Mat_Nest *vs = (Mat_Nest *)A->data; 403d8588912SDave May PetscInt i, j; 404d8588912SDave May 405d8588912SDave May PetscFunctionBegin; 406d8588912SDave May /* release the matrices and the place holders */ 4079566063dSJacob Faibussowitsch PetscCall(MatNestDestroyISList(vs->nr, &vs->isglobal.row)); 4089566063dSJacob Faibussowitsch PetscCall(MatNestDestroyISList(vs->nc, &vs->isglobal.col)); 4099566063dSJacob Faibussowitsch PetscCall(MatNestDestroyISList(vs->nr, &vs->islocal.row)); 4109566063dSJacob Faibussowitsch PetscCall(MatNestDestroyISList(vs->nc, &vs->islocal.col)); 411d8588912SDave May 4129566063dSJacob Faibussowitsch PetscCall(PetscFree(vs->row_len)); 4139566063dSJacob Faibussowitsch PetscCall(PetscFree(vs->col_len)); 4149566063dSJacob Faibussowitsch PetscCall(PetscFree(vs->nnzstate)); 415d8588912SDave May 4169566063dSJacob Faibussowitsch PetscCall(PetscFree2(vs->left, vs->right)); 417207556f9SJed Brown 418d8588912SDave May /* release the matrices and the place holders */ 419d8588912SDave May if (vs->m) { 420d8588912SDave May for (i = 0; i < vs->nr; i++) { 42148a46eb9SPierre Jolivet for (j = 0; j < vs->nc; j++) PetscCall(MatDestroy(&vs->m[i][j])); 422d8588912SDave May } 4238068ee9dSPierre Jolivet PetscCall(PetscFree(vs->m[0])); 4249566063dSJacob Faibussowitsch PetscCall(PetscFree(vs->m)); 425d8588912SDave May } 42606a1af2fSStefano Zampini 42706a1af2fSStefano Zampini /* restore defaults */ 42806a1af2fSStefano Zampini vs->nr = 0; 42906a1af2fSStefano Zampini vs->nc = 0; 43006a1af2fSStefano Zampini vs->splitassembly = PETSC_FALSE; 4313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 43206a1af2fSStefano Zampini } 43306a1af2fSStefano Zampini 434d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDestroy_Nest(Mat A) 435d71ae5a4SJacob Faibussowitsch { 436362febeeSStefano Zampini PetscFunctionBegin; 4379566063dSJacob Faibussowitsch PetscCall(MatReset_Nest(A)); 4389566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 4399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetSubMat_C", NULL)); 4409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestSetSubMat_C", NULL)); 4419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetSubMats_C", NULL)); 4429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetSize_C", NULL)); 4439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetISs_C", NULL)); 4449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetLocalISs_C", NULL)); 4459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestSetVecType_C", NULL)); 4469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestSetSubMats_C", NULL)); 4479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_mpiaij_C", NULL)); 4489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_seqaij_C", NULL)); 4499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_aij_C", NULL)); 4509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_is_C", NULL)); 4519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_mpidense_C", NULL)); 4529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_seqdense_C", NULL)); 4539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_nest_seqdense_C", NULL)); 4549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_nest_mpidense_C", NULL)); 4553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 456d8588912SDave May } 457d8588912SDave May 458d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMissingDiagonal_Nest(Mat mat, PetscBool *missing, PetscInt *dd) 459d71ae5a4SJacob Faibussowitsch { 460381b8e50SStefano Zampini Mat_Nest *vs = (Mat_Nest *)mat->data; 461381b8e50SStefano Zampini PetscInt i; 462381b8e50SStefano Zampini 463381b8e50SStefano Zampini PetscFunctionBegin; 464381b8e50SStefano Zampini if (dd) *dd = 0; 465381b8e50SStefano Zampini if (!vs->nr) { 466381b8e50SStefano Zampini *missing = PETSC_TRUE; 4673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 468381b8e50SStefano Zampini } 469381b8e50SStefano Zampini *missing = PETSC_FALSE; 470381b8e50SStefano Zampini for (i = 0; i < vs->nr && !(*missing); i++) { 471381b8e50SStefano Zampini *missing = PETSC_TRUE; 472381b8e50SStefano Zampini if (vs->m[i][i]) { 4739566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal(vs->m[i][i], missing, NULL)); 47408401ef6SPierre Jolivet PetscCheck(!*missing || !dd, PetscObjectComm((PetscObject)mat), PETSC_ERR_SUP, "First missing entry not yet implemented"); 475381b8e50SStefano Zampini } 476381b8e50SStefano Zampini } 4773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 478381b8e50SStefano Zampini } 479381b8e50SStefano Zampini 480d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyBegin_Nest(Mat A, MatAssemblyType type) 481d71ae5a4SJacob Faibussowitsch { 482d8588912SDave May Mat_Nest *vs = (Mat_Nest *)A->data; 483d8588912SDave May PetscInt i, j; 48406a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 485d8588912SDave May 486d8588912SDave May PetscFunctionBegin; 487d8588912SDave May for (i = 0; i < vs->nr; i++) { 488d8588912SDave May for (j = 0; j < vs->nc; j++) { 48906a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 490e7c19651SJed Brown if (vs->m[i][j]) { 4919566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(vs->m[i][j], type)); 492e7c19651SJed Brown if (!vs->splitassembly) { 493e7c19651SJed Brown /* Note: split assembly will fail if the same block appears more than once (even indirectly through a nested 494e7c19651SJed Brown * sub-block). This could be fixed by adding a flag to Mat so that there was a way to check if a Mat was 495e7c19651SJed Brown * already performing an assembly, but the result would by more complicated and appears to offer less 496e7c19651SJed Brown * potential for diagnostics and correctness checking. Split assembly should be fixed once there is an 497e7c19651SJed Brown * interface for libraries to make asynchronous progress in "user-defined non-blocking collectives". 498e7c19651SJed Brown */ 4999566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(vs->m[i][j], type)); 5009566063dSJacob Faibussowitsch PetscCall(MatGetNonzeroState(vs->m[i][j], &subnnzstate)); 501e7c19651SJed Brown } 502e7c19651SJed Brown } 50306a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || vs->nnzstate[i * vs->nc + j] != subnnzstate); 50406a1af2fSStefano Zampini vs->nnzstate[i * vs->nc + j] = subnnzstate; 505d8588912SDave May } 506d8588912SDave May } 50706a1af2fSStefano Zampini if (nnzstate) A->nonzerostate++; 5083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 509d8588912SDave May } 510d8588912SDave May 511d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyEnd_Nest(Mat A, MatAssemblyType type) 512d71ae5a4SJacob Faibussowitsch { 513d8588912SDave May Mat_Nest *vs = (Mat_Nest *)A->data; 514d8588912SDave May PetscInt i, j; 515d8588912SDave May 516d8588912SDave May PetscFunctionBegin; 517d8588912SDave May for (i = 0; i < vs->nr; i++) { 518d8588912SDave May for (j = 0; j < vs->nc; j++) { 519e7c19651SJed Brown if (vs->m[i][j]) { 52048a46eb9SPierre Jolivet if (vs->splitassembly) PetscCall(MatAssemblyEnd(vs->m[i][j], type)); 521e7c19651SJed Brown } 522d8588912SDave May } 523d8588912SDave May } 5243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 525d8588912SDave May } 526d8588912SDave May 527d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestFindNonzeroSubMatRow(Mat A, PetscInt row, Mat *B) 528d71ae5a4SJacob Faibussowitsch { 529f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 530f349c1fdSJed Brown PetscInt j; 531f349c1fdSJed Brown Mat sub; 532d8588912SDave May 533d8588912SDave May PetscFunctionBegin; 5340298fd71SBarry Smith sub = (row < vs->nc) ? vs->m[row][row] : (Mat)NULL; /* Prefer to find on the diagonal */ 535f349c1fdSJed Brown for (j = 0; !sub && j < vs->nc; j++) sub = vs->m[row][j]; 5369566063dSJacob Faibussowitsch if (sub) PetscCall(MatSetUp(sub)); /* Ensure that the sizes are available */ 537f349c1fdSJed Brown *B = sub; 5383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 539d8588912SDave May } 540d8588912SDave May 541d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestFindNonzeroSubMatCol(Mat A, PetscInt col, Mat *B) 542d71ae5a4SJacob Faibussowitsch { 543f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 544f349c1fdSJed Brown PetscInt i; 545f349c1fdSJed Brown Mat sub; 546f349c1fdSJed Brown 547f349c1fdSJed Brown PetscFunctionBegin; 5480298fd71SBarry Smith sub = (col < vs->nr) ? vs->m[col][col] : (Mat)NULL; /* Prefer to find on the diagonal */ 549f349c1fdSJed Brown for (i = 0; !sub && i < vs->nr; i++) sub = vs->m[i][col]; 5509566063dSJacob Faibussowitsch if (sub) PetscCall(MatSetUp(sub)); /* Ensure that the sizes are available */ 551f349c1fdSJed Brown *B = sub; 5523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 553d8588912SDave May } 554d8588912SDave May 555d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestFindISRange(Mat A, PetscInt n, const IS list[], IS is, PetscInt *begin, PetscInt *end) 556d71ae5a4SJacob Faibussowitsch { 55718d228c0SPierre Jolivet PetscInt i, j, size, m; 558f349c1fdSJed Brown PetscBool flg; 55918d228c0SPierre Jolivet IS out, concatenate[2]; 560f349c1fdSJed Brown 561f349c1fdSJed Brown PetscFunctionBegin; 5624f572ea9SToby Isaac PetscAssertPointer(list, 3); 563f349c1fdSJed Brown PetscValidHeaderSpecific(is, IS_CLASSID, 4); 56418d228c0SPierre Jolivet if (begin) { 5654f572ea9SToby Isaac PetscAssertPointer(begin, 5); 56618d228c0SPierre Jolivet *begin = -1; 56718d228c0SPierre Jolivet } 56818d228c0SPierre Jolivet if (end) { 5694f572ea9SToby Isaac PetscAssertPointer(end, 6); 57018d228c0SPierre Jolivet *end = -1; 57118d228c0SPierre Jolivet } 572f349c1fdSJed Brown for (i = 0; i < n; i++) { 573207556f9SJed Brown if (!list[i]) continue; 5749566063dSJacob Faibussowitsch PetscCall(ISEqualUnsorted(list[i], is, &flg)); 575f349c1fdSJed Brown if (flg) { 57618d228c0SPierre Jolivet if (begin) *begin = i; 57718d228c0SPierre Jolivet if (end) *end = i + 1; 5783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 579f349c1fdSJed Brown } 580f349c1fdSJed Brown } 5819566063dSJacob Faibussowitsch PetscCall(ISGetSize(is, &size)); 58218d228c0SPierre Jolivet for (i = 0; i < n - 1; i++) { 58318d228c0SPierre Jolivet if (!list[i]) continue; 58418d228c0SPierre Jolivet m = 0; 5859566063dSJacob Faibussowitsch PetscCall(ISConcatenate(PetscObjectComm((PetscObject)A), 2, list + i, &out)); 5869566063dSJacob Faibussowitsch PetscCall(ISGetSize(out, &m)); 58718d228c0SPierre Jolivet for (j = i + 2; j < n && m < size; j++) { 58818d228c0SPierre Jolivet if (list[j]) { 58918d228c0SPierre Jolivet concatenate[0] = out; 59018d228c0SPierre Jolivet concatenate[1] = list[j]; 5919566063dSJacob Faibussowitsch PetscCall(ISConcatenate(PetscObjectComm((PetscObject)A), 2, concatenate, &out)); 5929566063dSJacob Faibussowitsch PetscCall(ISDestroy(concatenate)); 5939566063dSJacob Faibussowitsch PetscCall(ISGetSize(out, &m)); 59418d228c0SPierre Jolivet } 59518d228c0SPierre Jolivet } 59618d228c0SPierre Jolivet if (m == size) { 5979566063dSJacob Faibussowitsch PetscCall(ISEqualUnsorted(out, is, &flg)); 59818d228c0SPierre Jolivet if (flg) { 59918d228c0SPierre Jolivet if (begin) *begin = i; 60018d228c0SPierre Jolivet if (end) *end = j; 6019566063dSJacob Faibussowitsch PetscCall(ISDestroy(&out)); 6023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 60318d228c0SPierre Jolivet } 60418d228c0SPierre Jolivet } 6059566063dSJacob Faibussowitsch PetscCall(ISDestroy(&out)); 60618d228c0SPierre Jolivet } 6073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 608f349c1fdSJed Brown } 609f349c1fdSJed Brown 610d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestFillEmptyMat_Private(Mat A, PetscInt i, PetscInt j, Mat *B) 611d71ae5a4SJacob Faibussowitsch { 6128188e55aSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 61318d228c0SPierre Jolivet PetscInt lr, lc; 61418d228c0SPierre Jolivet 61518d228c0SPierre Jolivet PetscFunctionBegin; 6169566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 6179566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(vs->isglobal.row[i], &lr)); 6189566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(vs->isglobal.col[j], &lc)); 6199566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, lr, lc, PETSC_DECIDE, PETSC_DECIDE)); 6209566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATAIJ)); 6219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(*B, 0, NULL)); 6229566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(*B, 0, NULL, 0, NULL)); 6239566063dSJacob Faibussowitsch PetscCall(MatSetUp(*B)); 6249566063dSJacob Faibussowitsch PetscCall(MatSetOption(*B, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE)); 6259566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 6269566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 6273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 62818d228c0SPierre Jolivet } 62918d228c0SPierre Jolivet 630d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestGetBlock_Private(Mat A, PetscInt rbegin, PetscInt rend, PetscInt cbegin, PetscInt cend, Mat *B) 631d71ae5a4SJacob Faibussowitsch { 63218d228c0SPierre Jolivet Mat_Nest *vs = (Mat_Nest *)A->data; 63318d228c0SPierre Jolivet Mat *a; 63418d228c0SPierre Jolivet PetscInt i, j, k, l, nr = rend - rbegin, nc = cend - cbegin; 6358188e55aSJed Brown char keyname[256]; 63618d228c0SPierre Jolivet PetscBool *b; 63718d228c0SPierre Jolivet PetscBool flg; 6388188e55aSJed Brown 6398188e55aSJed Brown PetscFunctionBegin; 6400298fd71SBarry Smith *B = NULL; 6419566063dSJacob Faibussowitsch PetscCall(PetscSNPrintf(keyname, sizeof(keyname), "NestBlock_%" PetscInt_FMT "-%" PetscInt_FMT "x%" PetscInt_FMT "-%" PetscInt_FMT, rbegin, rend, cbegin, cend)); 6429566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, keyname, (PetscObject *)B)); 6433ba16761SJacob Faibussowitsch if (*B) PetscFunctionReturn(PETSC_SUCCESS); 6448188e55aSJed Brown 6459566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nr * nc, &a, nr * nc, &b)); 64618d228c0SPierre Jolivet for (i = 0; i < nr; i++) { 64718d228c0SPierre Jolivet for (j = 0; j < nc; j++) { 64818d228c0SPierre Jolivet a[i * nc + j] = vs->m[rbegin + i][cbegin + j]; 64918d228c0SPierre Jolivet b[i * nc + j] = PETSC_FALSE; 65018d228c0SPierre Jolivet } 65118d228c0SPierre Jolivet } 65218d228c0SPierre Jolivet if (nc != vs->nc && nr != vs->nr) { 65318d228c0SPierre Jolivet for (i = 0; i < nr; i++) { 65418d228c0SPierre Jolivet for (j = 0; j < nc; j++) { 65518d228c0SPierre Jolivet flg = PETSC_FALSE; 65618d228c0SPierre Jolivet for (k = 0; (k < nr && !flg); k++) { 65718d228c0SPierre Jolivet if (a[j + k * nc]) flg = PETSC_TRUE; 65818d228c0SPierre Jolivet } 65918d228c0SPierre Jolivet if (flg) { 66018d228c0SPierre Jolivet flg = PETSC_FALSE; 66118d228c0SPierre Jolivet for (l = 0; (l < nc && !flg); l++) { 66218d228c0SPierre Jolivet if (a[i * nc + l]) flg = PETSC_TRUE; 66318d228c0SPierre Jolivet } 66418d228c0SPierre Jolivet } 66518d228c0SPierre Jolivet if (!flg) { 66618d228c0SPierre Jolivet b[i * nc + j] = PETSC_TRUE; 6679566063dSJacob Faibussowitsch PetscCall(MatNestFillEmptyMat_Private(A, rbegin + i, cbegin + j, a + i * nc + j)); 66818d228c0SPierre Jolivet } 66918d228c0SPierre Jolivet } 67018d228c0SPierre Jolivet } 67118d228c0SPierre Jolivet } 6729566063dSJacob Faibussowitsch PetscCall(MatCreateNest(PetscObjectComm((PetscObject)A), nr, nr != vs->nr ? NULL : vs->isglobal.row, nc, nc != vs->nc ? NULL : vs->isglobal.col, a, B)); 67318d228c0SPierre Jolivet for (i = 0; i < nr; i++) { 67418d228c0SPierre Jolivet for (j = 0; j < nc; j++) { 67548a46eb9SPierre Jolivet if (b[i * nc + j]) PetscCall(MatDestroy(a + i * nc + j)); 67618d228c0SPierre Jolivet } 67718d228c0SPierre Jolivet } 6789566063dSJacob Faibussowitsch PetscCall(PetscFree2(a, b)); 6798188e55aSJed Brown (*B)->assembled = A->assembled; 6809566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, keyname, (PetscObject)*B)); 6819566063dSJacob Faibussowitsch PetscCall(PetscObjectDereference((PetscObject)*B)); /* Leave the only remaining reference in the composition */ 6823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6838188e55aSJed Brown } 6848188e55aSJed Brown 685d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestFindSubMat(Mat A, struct MatNestISPair *is, IS isrow, IS iscol, Mat *B) 686d71ae5a4SJacob Faibussowitsch { 687f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 68818d228c0SPierre Jolivet PetscInt rbegin, rend, cbegin, cend; 689f349c1fdSJed Brown 690f349c1fdSJed Brown PetscFunctionBegin; 6919566063dSJacob Faibussowitsch PetscCall(MatNestFindISRange(A, vs->nr, is->row, isrow, &rbegin, &rend)); 6929566063dSJacob Faibussowitsch PetscCall(MatNestFindISRange(A, vs->nc, is->col, iscol, &cbegin, &cend)); 69318d228c0SPierre Jolivet if (rend == rbegin + 1 && cend == cbegin + 1) { 69448a46eb9SPierre Jolivet if (!vs->m[rbegin][cbegin]) PetscCall(MatNestFillEmptyMat_Private(A, rbegin, cbegin, vs->m[rbegin] + cbegin)); 69518d228c0SPierre Jolivet *B = vs->m[rbegin][cbegin]; 69618d228c0SPierre Jolivet } else if (rbegin != -1 && cbegin != -1) { 6979566063dSJacob Faibussowitsch PetscCall(MatNestGetBlock_Private(A, rbegin, rend, cbegin, cend, B)); 69818d228c0SPierre Jolivet } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_INCOMP, "Could not find index set"); 6993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 700f349c1fdSJed Brown } 701f349c1fdSJed Brown 70206a1af2fSStefano Zampini /* 70306a1af2fSStefano Zampini TODO: This does not actually returns a submatrix we can modify 70406a1af2fSStefano Zampini */ 705d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrix_Nest(Mat A, IS isrow, IS iscol, MatReuse reuse, Mat *B) 706d71ae5a4SJacob Faibussowitsch { 707f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 708f349c1fdSJed Brown Mat sub; 709f349c1fdSJed Brown 710f349c1fdSJed Brown PetscFunctionBegin; 7119566063dSJacob Faibussowitsch PetscCall(MatNestFindSubMat(A, &vs->isglobal, isrow, iscol, &sub)); 712f349c1fdSJed Brown switch (reuse) { 713f349c1fdSJed Brown case MAT_INITIAL_MATRIX: 7149566063dSJacob Faibussowitsch if (sub) PetscCall(PetscObjectReference((PetscObject)sub)); 715f349c1fdSJed Brown *B = sub; 716f349c1fdSJed Brown break; 717d71ae5a4SJacob Faibussowitsch case MAT_REUSE_MATRIX: 718d71ae5a4SJacob Faibussowitsch PetscCheck(sub == *B, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Submatrix was not used before in this call"); 719d71ae5a4SJacob Faibussowitsch break; 720d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_MATRIX: /* Nothing to do */ 721d71ae5a4SJacob Faibussowitsch break; 722d71ae5a4SJacob Faibussowitsch case MAT_INPLACE_MATRIX: /* Nothing to do */ 723d71ae5a4SJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "MAT_INPLACE_MATRIX is not supported yet"); 724f349c1fdSJed Brown } 7253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 726f349c1fdSJed Brown } 727f349c1fdSJed Brown 72866976f2fSJacob Faibussowitsch static PetscErrorCode MatGetLocalSubMatrix_Nest(Mat A, IS isrow, IS iscol, Mat *B) 729d71ae5a4SJacob Faibussowitsch { 730f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 731f349c1fdSJed Brown Mat sub; 732f349c1fdSJed Brown 733f349c1fdSJed Brown PetscFunctionBegin; 7349566063dSJacob Faibussowitsch PetscCall(MatNestFindSubMat(A, &vs->islocal, isrow, iscol, &sub)); 735f349c1fdSJed Brown /* We allow the submatrix to be NULL, perhaps it would be better for the user to return an empty matrix instead */ 7369566063dSJacob Faibussowitsch if (sub) PetscCall(PetscObjectReference((PetscObject)sub)); 737f349c1fdSJed Brown *B = sub; 7383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 739d8588912SDave May } 740d8588912SDave May 741d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreLocalSubMatrix_Nest(Mat A, IS isrow, IS iscol, Mat *B) 742d71ae5a4SJacob Faibussowitsch { 743f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 744f349c1fdSJed Brown Mat sub; 745d8588912SDave May 746d8588912SDave May PetscFunctionBegin; 7479566063dSJacob Faibussowitsch PetscCall(MatNestFindSubMat(A, &vs->islocal, isrow, iscol, &sub)); 74808401ef6SPierre Jolivet PetscCheck(*B == sub, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Local submatrix has not been gotten"); 749f349c1fdSJed Brown if (sub) { 750aed4548fSBarry Smith PetscCheck(((PetscObject)sub)->refct > 1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Local submatrix has had reference count decremented too many times"); 7519566063dSJacob Faibussowitsch PetscCall(MatDestroy(B)); 752d8588912SDave May } 7533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 754d8588912SDave May } 755d8588912SDave May 756d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_Nest(Mat A, Vec v) 757d71ae5a4SJacob Faibussowitsch { 7587874fa86SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 7597874fa86SDave May PetscInt i; 7607874fa86SDave May 7617874fa86SDave May PetscFunctionBegin; 7627874fa86SDave May for (i = 0; i < bA->nr; i++) { 763429bac76SJed Brown Vec bv; 7649566063dSJacob Faibussowitsch PetscCall(VecGetSubVector(v, bA->isglobal.row[i], &bv)); 7657874fa86SDave May if (bA->m[i][i]) { 7669566063dSJacob Faibussowitsch PetscCall(MatGetDiagonal(bA->m[i][i], bv)); 7677874fa86SDave May } else { 7689566063dSJacob Faibussowitsch PetscCall(VecSet(bv, 0.0)); 7697874fa86SDave May } 7709566063dSJacob Faibussowitsch PetscCall(VecRestoreSubVector(v, bA->isglobal.row[i], &bv)); 7717874fa86SDave May } 7723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7737874fa86SDave May } 7747874fa86SDave May 775d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDiagonalScale_Nest(Mat A, Vec l, Vec r) 776d71ae5a4SJacob Faibussowitsch { 7777874fa86SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 778429bac76SJed Brown Vec bl, *br; 7797874fa86SDave May PetscInt i, j; 7807874fa86SDave May 7817874fa86SDave May PetscFunctionBegin; 7829566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(bA->nc, &br)); 7832e6472ebSElliott Sales de Andrade if (r) { 7849566063dSJacob Faibussowitsch for (j = 0; j < bA->nc; j++) PetscCall(VecGetSubVector(r, bA->isglobal.col[j], &br[j])); 7852e6472ebSElliott Sales de Andrade } 7862e6472ebSElliott Sales de Andrade bl = NULL; 7877874fa86SDave May for (i = 0; i < bA->nr; i++) { 78848a46eb9SPierre Jolivet if (l) PetscCall(VecGetSubVector(l, bA->isglobal.row[i], &bl)); 7897874fa86SDave May for (j = 0; j < bA->nc; j++) { 79048a46eb9SPierre Jolivet if (bA->m[i][j]) PetscCall(MatDiagonalScale(bA->m[i][j], bl, br[j])); 7917874fa86SDave May } 79248a46eb9SPierre Jolivet if (l) PetscCall(VecRestoreSubVector(l, bA->isglobal.row[i], &bl)); 7932e6472ebSElliott Sales de Andrade } 7942e6472ebSElliott Sales de Andrade if (r) { 7959566063dSJacob Faibussowitsch for (j = 0; j < bA->nc; j++) PetscCall(VecRestoreSubVector(r, bA->isglobal.col[j], &br[j])); 7962e6472ebSElliott Sales de Andrade } 7979566063dSJacob Faibussowitsch PetscCall(PetscFree(br)); 7983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7997874fa86SDave May } 8007874fa86SDave May 801d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatScale_Nest(Mat A, PetscScalar a) 802d71ae5a4SJacob Faibussowitsch { 803a061e289SJed Brown Mat_Nest *bA = (Mat_Nest *)A->data; 804a061e289SJed Brown PetscInt i, j; 805a061e289SJed Brown 806a061e289SJed Brown PetscFunctionBegin; 807a061e289SJed Brown for (i = 0; i < bA->nr; i++) { 808a061e289SJed Brown for (j = 0; j < bA->nc; j++) { 80948a46eb9SPierre Jolivet if (bA->m[i][j]) PetscCall(MatScale(bA->m[i][j], a)); 810a061e289SJed Brown } 811a061e289SJed Brown } 8123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a061e289SJed Brown } 814a061e289SJed Brown 815d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatShift_Nest(Mat A, PetscScalar a) 816d71ae5a4SJacob Faibussowitsch { 817a061e289SJed Brown Mat_Nest *bA = (Mat_Nest *)A->data; 818a061e289SJed Brown PetscInt i; 81906a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 820a061e289SJed Brown 821a061e289SJed Brown PetscFunctionBegin; 822a061e289SJed Brown for (i = 0; i < bA->nr; i++) { 82306a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 82408401ef6SPierre Jolivet PetscCheck(bA->m[i][i], PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "No support for shifting an empty diagonal block, insert a matrix in block (%" PetscInt_FMT ",%" PetscInt_FMT ")", i, i); 8259566063dSJacob Faibussowitsch PetscCall(MatShift(bA->m[i][i], a)); 8269566063dSJacob Faibussowitsch PetscCall(MatGetNonzeroState(bA->m[i][i], &subnnzstate)); 82706a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i * bA->nc + i] != subnnzstate); 82806a1af2fSStefano Zampini bA->nnzstate[i * bA->nc + i] = subnnzstate; 829a061e289SJed Brown } 83006a1af2fSStefano Zampini if (nnzstate) A->nonzerostate++; 8313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 832a061e289SJed Brown } 833a061e289SJed Brown 834d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDiagonalSet_Nest(Mat A, Vec D, InsertMode is) 835d71ae5a4SJacob Faibussowitsch { 83613135bc6SAlex Fikl Mat_Nest *bA = (Mat_Nest *)A->data; 83713135bc6SAlex Fikl PetscInt i; 83806a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 83913135bc6SAlex Fikl 84013135bc6SAlex Fikl PetscFunctionBegin; 84113135bc6SAlex Fikl for (i = 0; i < bA->nr; i++) { 84206a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 84313135bc6SAlex Fikl Vec bv; 8449566063dSJacob Faibussowitsch PetscCall(VecGetSubVector(D, bA->isglobal.row[i], &bv)); 84513135bc6SAlex Fikl if (bA->m[i][i]) { 8469566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet(bA->m[i][i], bv, is)); 8479566063dSJacob Faibussowitsch PetscCall(MatGetNonzeroState(bA->m[i][i], &subnnzstate)); 84813135bc6SAlex Fikl } 8499566063dSJacob Faibussowitsch PetscCall(VecRestoreSubVector(D, bA->isglobal.row[i], &bv)); 85006a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i * bA->nc + i] != subnnzstate); 85106a1af2fSStefano Zampini bA->nnzstate[i * bA->nc + i] = subnnzstate; 85213135bc6SAlex Fikl } 85306a1af2fSStefano Zampini if (nnzstate) A->nonzerostate++; 8543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 85513135bc6SAlex Fikl } 85613135bc6SAlex Fikl 857d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_Nest(Mat A, PetscRandom rctx) 858d71ae5a4SJacob Faibussowitsch { 859f8170845SAlex Fikl Mat_Nest *bA = (Mat_Nest *)A->data; 860f8170845SAlex Fikl PetscInt i, j; 861f8170845SAlex Fikl 862f8170845SAlex Fikl PetscFunctionBegin; 863f8170845SAlex Fikl for (i = 0; i < bA->nr; i++) { 864f8170845SAlex Fikl for (j = 0; j < bA->nc; j++) { 86548a46eb9SPierre Jolivet if (bA->m[i][j]) PetscCall(MatSetRandom(bA->m[i][j], rctx)); 866f8170845SAlex Fikl } 867f8170845SAlex Fikl } 8683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 869f8170845SAlex Fikl } 870f8170845SAlex Fikl 871d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatCreateVecs_Nest(Mat A, Vec *right, Vec *left) 872d71ae5a4SJacob Faibussowitsch { 873d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 874d8588912SDave May Vec *L, *R; 875d8588912SDave May MPI_Comm comm; 876d8588912SDave May PetscInt i, j; 877d8588912SDave May 878d8588912SDave May PetscFunctionBegin; 8799566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)A, &comm)); 880d8588912SDave May if (right) { 881d8588912SDave May /* allocate R */ 8829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bA->nc, &R)); 883d8588912SDave May /* Create the right vectors */ 884d8588912SDave May for (j = 0; j < bA->nc; j++) { 885d8588912SDave May for (i = 0; i < bA->nr; i++) { 886d8588912SDave May if (bA->m[i][j]) { 8879566063dSJacob Faibussowitsch PetscCall(MatCreateVecs(bA->m[i][j], &R[j], NULL)); 888d8588912SDave May break; 889d8588912SDave May } 890d8588912SDave May } 89108401ef6SPierre Jolivet PetscCheck(i != bA->nr, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null column."); 892d8588912SDave May } 8939566063dSJacob Faibussowitsch PetscCall(VecCreateNest(comm, bA->nc, bA->isglobal.col, R, right)); 894d8588912SDave May /* hand back control to the nest vector */ 89548a46eb9SPierre Jolivet for (j = 0; j < bA->nc; j++) PetscCall(VecDestroy(&R[j])); 8969566063dSJacob Faibussowitsch PetscCall(PetscFree(R)); 897d8588912SDave May } 898d8588912SDave May 899d8588912SDave May if (left) { 900d8588912SDave May /* allocate L */ 9019566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bA->nr, &L)); 902d8588912SDave May /* Create the left vectors */ 903d8588912SDave May for (i = 0; i < bA->nr; i++) { 904d8588912SDave May for (j = 0; j < bA->nc; j++) { 905d8588912SDave May if (bA->m[i][j]) { 9069566063dSJacob Faibussowitsch PetscCall(MatCreateVecs(bA->m[i][j], NULL, &L[i])); 907d8588912SDave May break; 908d8588912SDave May } 909d8588912SDave May } 91008401ef6SPierre Jolivet PetscCheck(j != bA->nc, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null row."); 911d8588912SDave May } 912d8588912SDave May 9139566063dSJacob Faibussowitsch PetscCall(VecCreateNest(comm, bA->nr, bA->isglobal.row, L, left)); 91448a46eb9SPierre Jolivet for (i = 0; i < bA->nr; i++) PetscCall(VecDestroy(&L[i])); 915d8588912SDave May 9169566063dSJacob Faibussowitsch PetscCall(PetscFree(L)); 917d8588912SDave May } 9183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 919d8588912SDave May } 920d8588912SDave May 921d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_Nest(Mat A, PetscViewer viewer) 922d71ae5a4SJacob Faibussowitsch { 923d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 92429e60adbSStefano Zampini PetscBool isascii, viewSub = PETSC_FALSE; 925d8588912SDave May PetscInt i, j; 926d8588912SDave May 927d8588912SDave May PetscFunctionBegin; 9289566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &isascii)); 929d8588912SDave May if (isascii) { 9309566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)A)->options, ((PetscObject)A)->prefix, "-mat_view_nest_sub", &viewSub, NULL)); 9319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "Matrix object:\n")); 9329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPushTab(viewer)); 9339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "type=nest, rows=%" PetscInt_FMT ", cols=%" PetscInt_FMT "\n", bA->nr, bA->nc)); 934d8588912SDave May 9359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "MatNest structure:\n")); 936d8588912SDave May for (i = 0; i < bA->nr; i++) { 937d8588912SDave May for (j = 0; j < bA->nc; j++) { 93819fd82e9SBarry Smith MatType type; 939270f95d7SJed Brown char name[256] = "", prefix[256] = ""; 940d8588912SDave May PetscInt NR, NC; 941d8588912SDave May PetscBool isNest = PETSC_FALSE; 942d8588912SDave May 943d8588912SDave May if (!bA->m[i][j]) { 9449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "(%" PetscInt_FMT ",%" PetscInt_FMT ") : NULL\n", i, j)); 945d8588912SDave May continue; 946d8588912SDave May } 9479566063dSJacob Faibussowitsch PetscCall(MatGetSize(bA->m[i][j], &NR, &NC)); 9489566063dSJacob Faibussowitsch PetscCall(MatGetType(bA->m[i][j], &type)); 9499566063dSJacob Faibussowitsch if (((PetscObject)bA->m[i][j])->name) PetscCall(PetscSNPrintf(name, sizeof(name), "name=\"%s\", ", ((PetscObject)bA->m[i][j])->name)); 9509566063dSJacob Faibussowitsch if (((PetscObject)bA->m[i][j])->prefix) PetscCall(PetscSNPrintf(prefix, sizeof(prefix), "prefix=\"%s\", ", ((PetscObject)bA->m[i][j])->prefix)); 9519566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)bA->m[i][j], MATNEST, &isNest)); 952d8588912SDave May 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "(%" PetscInt_FMT ",%" PetscInt_FMT ") : %s%stype=%s, rows=%" PetscInt_FMT ", cols=%" PetscInt_FMT "\n", i, j, name, prefix, type, NR, NC)); 954d8588912SDave May 95529e60adbSStefano Zampini if (isNest || viewSub) { 9569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPushTab(viewer)); /* push1 */ 9579566063dSJacob Faibussowitsch PetscCall(MatView(bA->m[i][j], viewer)); 9589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPopTab(viewer)); /* pop1 */ 959d8588912SDave May } 960d8588912SDave May } 961d8588912SDave May } 9629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPopTab(viewer)); /* pop0 */ 963d8588912SDave May } 9643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 965d8588912SDave May } 966d8588912SDave May 967d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroEntries_Nest(Mat A) 968d71ae5a4SJacob Faibussowitsch { 969d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 970d8588912SDave May PetscInt i, j; 971d8588912SDave May 972d8588912SDave May PetscFunctionBegin; 973d8588912SDave May for (i = 0; i < bA->nr; i++) { 974d8588912SDave May for (j = 0; j < bA->nc; j++) { 975d8588912SDave May if (!bA->m[i][j]) continue; 9769566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(bA->m[i][j])); 977d8588912SDave May } 978d8588912SDave May } 9793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 980d8588912SDave May } 981d8588912SDave May 982d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatCopy_Nest(Mat A, Mat B, MatStructure str) 983d71ae5a4SJacob Faibussowitsch { 984c222c20dSDavid Ham Mat_Nest *bA = (Mat_Nest *)A->data, *bB = (Mat_Nest *)B->data; 985c222c20dSDavid Ham PetscInt i, j, nr = bA->nr, nc = bA->nc; 98606a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 987c222c20dSDavid Ham 988c222c20dSDavid Ham PetscFunctionBegin; 989aed4548fSBarry Smith PetscCheck(nr == bB->nr && nc == bB->nc, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_INCOMP, "Cannot copy a Mat_Nest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ") to a Mat_Nest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ")", bB->nr, bB->nc, nr, nc); 990c222c20dSDavid Ham for (i = 0; i < nr; i++) { 991c222c20dSDavid Ham for (j = 0; j < nc; j++) { 99206a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 99346a2b97cSJed Brown if (bA->m[i][j] && bB->m[i][j]) { 9949566063dSJacob Faibussowitsch PetscCall(MatCopy(bA->m[i][j], bB->m[i][j], str)); 99508401ef6SPierre Jolivet } else PetscCheck(!bA->m[i][j] && !bB->m[i][j], PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_INCOMP, "Matrix block does not exist at %" PetscInt_FMT ",%" PetscInt_FMT, i, j); 9969566063dSJacob Faibussowitsch PetscCall(MatGetNonzeroState(bB->m[i][j], &subnnzstate)); 99706a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || bB->nnzstate[i * nc + j] != subnnzstate); 99806a1af2fSStefano Zampini bB->nnzstate[i * nc + j] = subnnzstate; 999c222c20dSDavid Ham } 1000c222c20dSDavid Ham } 100106a1af2fSStefano Zampini if (nnzstate) B->nonzerostate++; 10023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1003c222c20dSDavid Ham } 1004c222c20dSDavid Ham 1005d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAXPY_Nest(Mat Y, PetscScalar a, Mat X, MatStructure str) 1006d71ae5a4SJacob Faibussowitsch { 10076e76ffeaSPierre Jolivet Mat_Nest *bY = (Mat_Nest *)Y->data, *bX = (Mat_Nest *)X->data; 10086e76ffeaSPierre Jolivet PetscInt i, j, nr = bY->nr, nc = bY->nc; 100906a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 10106e76ffeaSPierre Jolivet 10116e76ffeaSPierre Jolivet PetscFunctionBegin; 1012aed4548fSBarry Smith PetscCheck(nr == bX->nr && nc == bX->nc, PetscObjectComm((PetscObject)Y), PETSC_ERR_ARG_INCOMP, "Cannot AXPY a MatNest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ") with a MatNest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ")", bX->nr, bX->nc, nr, nc); 10136e76ffeaSPierre Jolivet for (i = 0; i < nr; i++) { 10146e76ffeaSPierre Jolivet for (j = 0; j < nc; j++) { 101506a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 10166e76ffeaSPierre Jolivet if (bY->m[i][j] && bX->m[i][j]) { 10179566063dSJacob Faibussowitsch PetscCall(MatAXPY(bY->m[i][j], a, bX->m[i][j], str)); 1018c066aebcSStefano Zampini } else if (bX->m[i][j]) { 1019c066aebcSStefano Zampini Mat M; 1020c066aebcSStefano Zampini 1021e75569e9SPierre Jolivet PetscCheck(str == DIFFERENT_NONZERO_PATTERN || str == UNKNOWN_NONZERO_PATTERN, PetscObjectComm((PetscObject)Y), PETSC_ERR_ARG_INCOMP, "Matrix block does not exist at %" PetscInt_FMT ",%" PetscInt_FMT ". Use DIFFERENT_NONZERO_PATTERN or UNKNOWN_NONZERO_PATTERN", i, j); 10229566063dSJacob Faibussowitsch PetscCall(MatDuplicate(bX->m[i][j], MAT_COPY_VALUES, &M)); 10239566063dSJacob Faibussowitsch PetscCall(MatNestSetSubMat(Y, i, j, M)); 10249566063dSJacob Faibussowitsch PetscCall(MatDestroy(&M)); 1025c066aebcSStefano Zampini } 10269566063dSJacob Faibussowitsch if (bY->m[i][j]) PetscCall(MatGetNonzeroState(bY->m[i][j], &subnnzstate)); 102706a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || bY->nnzstate[i * nc + j] != subnnzstate); 102806a1af2fSStefano Zampini bY->nnzstate[i * nc + j] = subnnzstate; 10296e76ffeaSPierre Jolivet } 10306e76ffeaSPierre Jolivet } 103106a1af2fSStefano Zampini if (nnzstate) Y->nonzerostate++; 10323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10336e76ffeaSPierre Jolivet } 10346e76ffeaSPierre Jolivet 1035d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDuplicate_Nest(Mat A, MatDuplicateOption op, Mat *B) 1036d71ae5a4SJacob Faibussowitsch { 1037d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 1038841e96a3SJed Brown Mat *b; 1039841e96a3SJed Brown PetscInt i, j, nr = bA->nr, nc = bA->nc; 1040d8588912SDave May 1041d8588912SDave May PetscFunctionBegin; 10429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nr * nc, &b)); 1043841e96a3SJed Brown for (i = 0; i < nr; i++) { 1044841e96a3SJed Brown for (j = 0; j < nc; j++) { 1045841e96a3SJed Brown if (bA->m[i][j]) { 10469566063dSJacob Faibussowitsch PetscCall(MatDuplicate(bA->m[i][j], op, &b[i * nc + j])); 1047841e96a3SJed Brown } else { 10480298fd71SBarry Smith b[i * nc + j] = NULL; 1049d8588912SDave May } 1050d8588912SDave May } 1051d8588912SDave May } 10529566063dSJacob Faibussowitsch PetscCall(MatCreateNest(PetscObjectComm((PetscObject)A), nr, bA->isglobal.row, nc, bA->isglobal.col, b, B)); 1053841e96a3SJed Brown /* Give the new MatNest exclusive ownership */ 105448a46eb9SPierre Jolivet for (i = 0; i < nr * nc; i++) PetscCall(MatDestroy(&b[i])); 10559566063dSJacob Faibussowitsch PetscCall(PetscFree(b)); 1056d8588912SDave May 10579566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 10589566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 10593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1060d8588912SDave May } 1061d8588912SDave May 1062d8588912SDave May /* nest api */ 106366976f2fSJacob Faibussowitsch static PetscErrorCode MatNestGetSubMat_Nest(Mat A, PetscInt idxm, PetscInt jdxm, Mat *mat) 1064d71ae5a4SJacob Faibussowitsch { 1065d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 10665fd66863SKarl Rupp 1067d8588912SDave May PetscFunctionBegin; 106808401ef6SPierre Jolivet PetscCheck(idxm < bA->nr, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, idxm, bA->nr - 1); 106908401ef6SPierre Jolivet PetscCheck(jdxm < bA->nc, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Col too large: row %" PetscInt_FMT " max %" PetscInt_FMT, jdxm, bA->nc - 1); 1070d8588912SDave May *mat = bA->m[idxm][jdxm]; 10713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1072d8588912SDave May } 1073d8588912SDave May 10749ba0d327SJed Brown /*@ 107511a5261eSBarry Smith MatNestGetSubMat - Returns a single, sub-matrix from a `MATNEST` 1076d8588912SDave May 10772ef1f0ffSBarry Smith Not Collective 1078d8588912SDave May 1079d8588912SDave May Input Parameters: 108011a5261eSBarry Smith + A - `MATNEST` matrix 1081d8588912SDave May . idxm - index of the matrix within the nest matrix 1082629881c0SJed Brown - jdxm - index of the matrix within the nest matrix 1083d8588912SDave May 1084d8588912SDave May Output Parameter: 10852ef1f0ffSBarry Smith . sub - matrix at index `idxm`, `jdxm` within the nest matrix 1086d8588912SDave May 1087d8588912SDave May Level: developer 1088d8588912SDave May 1089fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatNestGetSize()`, `MatNestGetSubMats()`, `MatCreateNest()`, `MatNestSetSubMat()`, 1090db781477SPatrick Sanan `MatNestGetLocalISs()`, `MatNestGetISs()` 1091d8588912SDave May @*/ 1092d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestGetSubMat(Mat A, PetscInt idxm, PetscInt jdxm, Mat *sub) 1093d71ae5a4SJacob Faibussowitsch { 1094d8588912SDave May PetscFunctionBegin; 10953536838dSStefano Zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 10963536838dSStefano Zampini PetscValidLogicalCollectiveInt(A, idxm, 2); 10973536838dSStefano Zampini PetscValidLogicalCollectiveInt(A, jdxm, 3); 10983536838dSStefano Zampini PetscAssertPointer(sub, 4); 1099cac4c232SBarry Smith PetscUseMethod(A, "MatNestGetSubMat_C", (Mat, PetscInt, PetscInt, Mat *), (A, idxm, jdxm, sub)); 11003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1101d8588912SDave May } 1102d8588912SDave May 110366976f2fSJacob Faibussowitsch static PetscErrorCode MatNestSetSubMat_Nest(Mat A, PetscInt idxm, PetscInt jdxm, Mat mat) 1104d71ae5a4SJacob Faibussowitsch { 11050782ca92SJed Brown Mat_Nest *bA = (Mat_Nest *)A->data; 11060782ca92SJed Brown PetscInt m, n, M, N, mi, ni, Mi, Ni; 11070782ca92SJed Brown 11080782ca92SJed Brown PetscFunctionBegin; 110908401ef6SPierre Jolivet PetscCheck(idxm < bA->nr, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, idxm, bA->nr - 1); 111008401ef6SPierre Jolivet PetscCheck(jdxm < bA->nc, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Col too large: row %" PetscInt_FMT " max %" PetscInt_FMT, jdxm, bA->nc - 1); 11113536838dSStefano Zampini if (mat) { 11129566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(mat, &m, &n)); 11139566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 11149566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(bA->isglobal.row[idxm], &mi)); 11159566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.row[idxm], &Mi)); 11169566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(bA->isglobal.col[jdxm], &ni)); 11179566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.col[jdxm], &Ni)); 1118aed4548fSBarry Smith PetscCheck(M == Mi && N == Ni, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_INCOMP, "Submatrix dimension (%" PetscInt_FMT ",%" PetscInt_FMT ") incompatible with nest block (%" PetscInt_FMT ",%" PetscInt_FMT ")", M, N, Mi, Ni); 1119aed4548fSBarry Smith PetscCheck(m == mi && n == ni, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_INCOMP, "Submatrix local dimension (%" PetscInt_FMT ",%" PetscInt_FMT ") incompatible with nest block (%" PetscInt_FMT ",%" PetscInt_FMT ")", m, n, mi, ni); 11203536838dSStefano Zampini } 112126fbe8dcSKarl Rupp 112206a1af2fSStefano Zampini /* do not increase object state */ 11233ba16761SJacob Faibussowitsch if (mat == bA->m[idxm][jdxm]) PetscFunctionReturn(PETSC_SUCCESS); 112406a1af2fSStefano Zampini 11259566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)mat)); 11269566063dSJacob Faibussowitsch PetscCall(MatDestroy(&bA->m[idxm][jdxm])); 11270782ca92SJed Brown bA->m[idxm][jdxm] = mat; 11289566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 11293536838dSStefano Zampini if (mat) PetscCall(MatGetNonzeroState(mat, &bA->nnzstate[idxm * bA->nc + jdxm])); 11303536838dSStefano Zampini else bA->nnzstate[idxm * bA->nc + jdxm] = 0; 113106a1af2fSStefano Zampini A->nonzerostate++; 11323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11330782ca92SJed Brown } 11340782ca92SJed Brown 11359ba0d327SJed Brown /*@ 113611a5261eSBarry Smith MatNestSetSubMat - Set a single submatrix in the `MATNEST` 11370782ca92SJed Brown 11382ef1f0ffSBarry Smith Logically Collective 11390782ca92SJed Brown 11400782ca92SJed Brown Input Parameters: 114111a5261eSBarry Smith + A - `MATNEST` matrix 11420782ca92SJed Brown . idxm - index of the matrix within the nest matrix 11430782ca92SJed Brown . jdxm - index of the matrix within the nest matrix 11442ef1f0ffSBarry Smith - sub - matrix at index `idxm`, `jdxm` within the nest matrix 11452ef1f0ffSBarry Smith 11462ef1f0ffSBarry Smith Level: developer 11470782ca92SJed Brown 11480782ca92SJed Brown Notes: 11490782ca92SJed Brown The new submatrix must have the same size and communicator as that block of the nest. 11500782ca92SJed Brown 11510782ca92SJed Brown This increments the reference count of the submatrix. 11520782ca92SJed Brown 1153fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatNestSetSubMats()`, `MatNestGetSubMats()`, `MatNestGetLocalISs()`, `MatCreateNest()`, 1154db781477SPatrick Sanan `MatNestGetSubMat()`, `MatNestGetISs()`, `MatNestGetSize()` 11550782ca92SJed Brown @*/ 1156d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestSetSubMat(Mat A, PetscInt idxm, PetscInt jdxm, Mat sub) 1157d71ae5a4SJacob Faibussowitsch { 11580782ca92SJed Brown PetscFunctionBegin; 11593536838dSStefano Zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 11603536838dSStefano Zampini PetscValidLogicalCollectiveInt(A, idxm, 2); 11613536838dSStefano Zampini PetscValidLogicalCollectiveInt(A, jdxm, 3); 11623536838dSStefano Zampini if (sub) PetscValidHeaderSpecific(sub, MAT_CLASSID, 4); 11633536838dSStefano Zampini PetscTryMethod(A, "MatNestSetSubMat_C", (Mat, PetscInt, PetscInt, Mat), (A, idxm, jdxm, sub)); 11643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11650782ca92SJed Brown } 11660782ca92SJed Brown 116766976f2fSJacob Faibussowitsch static PetscErrorCode MatNestGetSubMats_Nest(Mat A, PetscInt *M, PetscInt *N, Mat ***mat) 1168d71ae5a4SJacob Faibussowitsch { 1169d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 11705fd66863SKarl Rupp 1171d8588912SDave May PetscFunctionBegin; 117226fbe8dcSKarl Rupp if (M) *M = bA->nr; 117326fbe8dcSKarl Rupp if (N) *N = bA->nc; 117426fbe8dcSKarl Rupp if (mat) *mat = bA->m; 11753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1176d8588912SDave May } 1177d8588912SDave May 1178d8588912SDave May /*@C 117911a5261eSBarry Smith MatNestGetSubMats - Returns the entire two dimensional array of matrices defining a `MATNEST` matrix. 1180d8588912SDave May 11812ef1f0ffSBarry Smith Not Collective 1182d8588912SDave May 1183f899ff85SJose E. Roman Input Parameter: 1184629881c0SJed Brown . A - nest matrix 1185d8588912SDave May 1186d8d19677SJose E. Roman Output Parameters: 1187*a3b724e8SBarry Smith + M - number of submatrix rows in the nest matrix 1188*a3b724e8SBarry Smith . N - number of submatrix columns in the nest matrix 1189e9d3347aSJose E. Roman - mat - array of matrices 1190d8588912SDave May 11912ef1f0ffSBarry Smith Level: developer 11922ef1f0ffSBarry Smith 119311a5261eSBarry Smith Note: 11942ef1f0ffSBarry Smith The user should not free the array `mat`. 1195d8588912SDave May 1196fe59aa6dSJacob Faibussowitsch Fortran Notes: 1197*a3b724e8SBarry Smith This routine has a calling sequence `call MatNestGetSubMats(A, M, N, mat, ierr)` 119820f4b53cSBarry Smith where the space allocated for the optional argument `mat` is assumed large enough (if provided). 1199e9d3347aSJose E. Roman Matrices in `mat` are returned in row-major order, see `MatCreateNest()` for an example. 1200351962e3SVincent Le Chenadec 1201fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatNestGetSize()`, `MatNestGetSubMat()`, `MatNestGetLocalISs()`, `MatCreateNest()`, 1202db781477SPatrick Sanan `MatNestSetSubMats()`, `MatNestGetISs()`, `MatNestSetSubMat()` 1203d8588912SDave May @*/ 1204d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestGetSubMats(Mat A, PetscInt *M, PetscInt *N, Mat ***mat) 1205d71ae5a4SJacob Faibussowitsch { 1206d8588912SDave May PetscFunctionBegin; 12073536838dSStefano Zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1208cac4c232SBarry Smith PetscUseMethod(A, "MatNestGetSubMats_C", (Mat, PetscInt *, PetscInt *, Mat ***), (A, M, N, mat)); 12093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1210d8588912SDave May } 1211d8588912SDave May 121266976f2fSJacob Faibussowitsch static PetscErrorCode MatNestGetSize_Nest(Mat A, PetscInt *M, PetscInt *N) 1213d71ae5a4SJacob Faibussowitsch { 1214d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 1215d8588912SDave May 1216d8588912SDave May PetscFunctionBegin; 121726fbe8dcSKarl Rupp if (M) *M = bA->nr; 121826fbe8dcSKarl Rupp if (N) *N = bA->nc; 12193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1220d8588912SDave May } 1221d8588912SDave May 12229ba0d327SJed Brown /*@ 122311a5261eSBarry Smith MatNestGetSize - Returns the size of the `MATNEST` matrix. 1224d8588912SDave May 12252ef1f0ffSBarry Smith Not Collective 1226d8588912SDave May 1227f899ff85SJose E. Roman Input Parameter: 122811a5261eSBarry Smith . A - `MATNEST` matrix 1229d8588912SDave May 1230d8d19677SJose E. Roman Output Parameters: 1231629881c0SJed Brown + M - number of rows in the nested mat 1232629881c0SJed Brown - N - number of cols in the nested mat 1233d8588912SDave May 1234d8588912SDave May Level: developer 1235d8588912SDave May 1236fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatNestGetSubMat()`, `MatNestGetSubMats()`, `MatCreateNest()`, `MatNestGetLocalISs()`, 1237db781477SPatrick Sanan `MatNestGetISs()` 1238d8588912SDave May @*/ 1239d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestGetSize(Mat A, PetscInt *M, PetscInt *N) 1240d71ae5a4SJacob Faibussowitsch { 1241d8588912SDave May PetscFunctionBegin; 12423536838dSStefano Zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1243cac4c232SBarry Smith PetscUseMethod(A, "MatNestGetSize_C", (Mat, PetscInt *, PetscInt *), (A, M, N)); 12443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1245d8588912SDave May } 1246d8588912SDave May 1247d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestGetISs_Nest(Mat A, IS rows[], IS cols[]) 1248d71ae5a4SJacob Faibussowitsch { 1249900e7ff2SJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 1250900e7ff2SJed Brown PetscInt i; 1251900e7ff2SJed Brown 1252900e7ff2SJed Brown PetscFunctionBegin; 12539371c9d4SSatish Balay if (rows) 12549371c9d4SSatish Balay for (i = 0; i < vs->nr; i++) rows[i] = vs->isglobal.row[i]; 12559371c9d4SSatish Balay if (cols) 12569371c9d4SSatish Balay for (i = 0; i < vs->nc; i++) cols[i] = vs->isglobal.col[i]; 12573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1258900e7ff2SJed Brown } 1259900e7ff2SJed Brown 12603a4d7b9aSSatish Balay /*@C 126111a5261eSBarry Smith MatNestGetISs - Returns the index sets partitioning the row and column spaces of a `MATNEST` 1262900e7ff2SJed Brown 12632ef1f0ffSBarry Smith Not Collective 1264900e7ff2SJed Brown 1265f899ff85SJose E. Roman Input Parameter: 126611a5261eSBarry Smith . A - `MATNEST` matrix 1267900e7ff2SJed Brown 1268d8d19677SJose E. Roman Output Parameters: 1269*a3b724e8SBarry Smith + rows - array of row index sets (pass `NULL` to ignore) 1270*a3b724e8SBarry Smith - cols - array of column index sets (pass `NULL` to ignore) 1271900e7ff2SJed Brown 1272900e7ff2SJed Brown Level: advanced 1273900e7ff2SJed Brown 127411a5261eSBarry Smith Note: 12752ef1f0ffSBarry Smith The user must have allocated arrays of the correct size. The reference count is not increased on the returned `IS`s. 1276900e7ff2SJed Brown 1277fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatNestGetSubMat()`, `MatNestGetSubMats()`, `MatNestGetSize()`, `MatNestGetLocalISs()`, 1278fe59aa6dSJacob Faibussowitsch `MatCreateNest()`, `MatNestSetSubMats()` 1279900e7ff2SJed Brown @*/ 1280d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestGetISs(Mat A, IS rows[], IS cols[]) 1281d71ae5a4SJacob Faibussowitsch { 1282900e7ff2SJed Brown PetscFunctionBegin; 1283900e7ff2SJed Brown PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1284cac4c232SBarry Smith PetscUseMethod(A, "MatNestGetISs_C", (Mat, IS[], IS[]), (A, rows, cols)); 12853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1286900e7ff2SJed Brown } 1287900e7ff2SJed Brown 1288d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestGetLocalISs_Nest(Mat A, IS rows[], IS cols[]) 1289d71ae5a4SJacob Faibussowitsch { 1290900e7ff2SJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 1291900e7ff2SJed Brown PetscInt i; 1292900e7ff2SJed Brown 1293900e7ff2SJed Brown PetscFunctionBegin; 12949371c9d4SSatish Balay if (rows) 12959371c9d4SSatish Balay for (i = 0; i < vs->nr; i++) rows[i] = vs->islocal.row[i]; 12969371c9d4SSatish Balay if (cols) 12979371c9d4SSatish Balay for (i = 0; i < vs->nc; i++) cols[i] = vs->islocal.col[i]; 12983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1299900e7ff2SJed Brown } 1300900e7ff2SJed Brown 1301900e7ff2SJed Brown /*@C 130211a5261eSBarry Smith MatNestGetLocalISs - Returns the index sets partitioning the row and column spaces of a `MATNEST` 1303900e7ff2SJed Brown 13042ef1f0ffSBarry Smith Not Collective 1305900e7ff2SJed Brown 1306f899ff85SJose E. Roman Input Parameter: 130711a5261eSBarry Smith . A - `MATNEST` matrix 1308900e7ff2SJed Brown 1309d8d19677SJose E. Roman Output Parameters: 1310*a3b724e8SBarry Smith + rows - array of row index sets (pass `NULL` to ignore) 1311*a3b724e8SBarry Smith - cols - array of column index sets (pass `NULL` to ignore) 1312900e7ff2SJed Brown 1313900e7ff2SJed Brown Level: advanced 1314900e7ff2SJed Brown 131511a5261eSBarry Smith Note: 13162ef1f0ffSBarry Smith The user must have allocated arrays of the correct size. The reference count is not increased on the returned `IS`s. 1317900e7ff2SJed Brown 13181cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatNestGetSubMat()`, `MatNestGetSubMats()`, `MatNestGetSize()`, `MatNestGetISs()`, `MatCreateNest()`, 1319fe59aa6dSJacob Faibussowitsch `MatNestSetSubMats()`, `MatNestSetSubMat()` 1320900e7ff2SJed Brown @*/ 1321d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestGetLocalISs(Mat A, IS rows[], IS cols[]) 1322d71ae5a4SJacob Faibussowitsch { 1323900e7ff2SJed Brown PetscFunctionBegin; 1324900e7ff2SJed Brown PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1325cac4c232SBarry Smith PetscUseMethod(A, "MatNestGetLocalISs_C", (Mat, IS[], IS[]), (A, rows, cols)); 13263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1327900e7ff2SJed Brown } 1328900e7ff2SJed Brown 132966976f2fSJacob Faibussowitsch static PetscErrorCode MatNestSetVecType_Nest(Mat A, VecType vtype) 1330d71ae5a4SJacob Faibussowitsch { 1331207556f9SJed Brown PetscBool flg; 1332207556f9SJed Brown 1333207556f9SJed Brown PetscFunctionBegin; 13349566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(vtype, VECNEST, &flg)); 1335207556f9SJed Brown /* In reality, this only distinguishes VECNEST and "other" */ 13362a7a6963SBarry Smith if (flg) A->ops->getvecs = MatCreateVecs_Nest; 133712b53f24SSatish Balay else A->ops->getvecs = (PetscErrorCode(*)(Mat, Vec *, Vec *))0; 13383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1339207556f9SJed Brown } 1340207556f9SJed Brown 1341207556f9SJed Brown /*@C 134211a5261eSBarry Smith MatNestSetVecType - Sets the type of `Vec` returned by `MatCreateVecs()` 1343207556f9SJed Brown 13442ef1f0ffSBarry Smith Not Collective 1345207556f9SJed Brown 1346207556f9SJed Brown Input Parameters: 134711a5261eSBarry Smith + A - `MATNEST` matrix 134811a5261eSBarry Smith - vtype - `VecType` to use for creating vectors 1349207556f9SJed Brown 1350207556f9SJed Brown Level: developer 1351207556f9SJed Brown 1352fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatCreateVecs()`, `MatCreateNest()`, `VecType` 1353207556f9SJed Brown @*/ 1354d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestSetVecType(Mat A, VecType vtype) 1355d71ae5a4SJacob Faibussowitsch { 1356207556f9SJed Brown PetscFunctionBegin; 13573536838dSStefano Zampini PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1358cac4c232SBarry Smith PetscTryMethod(A, "MatNestSetVecType_C", (Mat, VecType), (A, vtype)); 13593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1360207556f9SJed Brown } 1361207556f9SJed Brown 136266976f2fSJacob Faibussowitsch static PetscErrorCode MatNestSetSubMats_Nest(Mat A, PetscInt nr, const IS is_row[], PetscInt nc, const IS is_col[], const Mat a[]) 1363d71ae5a4SJacob Faibussowitsch { 1364c8883902SJed Brown Mat_Nest *s = (Mat_Nest *)A->data; 1365c8883902SJed Brown PetscInt i, j, m, n, M, N; 136688ffe2e8SJose E. Roman PetscBool cong, isstd, sametype = PETSC_FALSE; 136788ffe2e8SJose E. Roman VecType vtype, type; 1368d8588912SDave May 1369d8588912SDave May PetscFunctionBegin; 13709566063dSJacob Faibussowitsch PetscCall(MatReset_Nest(A)); 137106a1af2fSStefano Zampini 1372c8883902SJed Brown s->nr = nr; 1373c8883902SJed Brown s->nc = nc; 1374d8588912SDave May 1375c8883902SJed Brown /* Create space for submatrices */ 13769566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nr, &s->m)); 13778068ee9dSPierre Jolivet PetscCall(PetscMalloc1(nr * nc, &s->m[0])); 1378c8883902SJed Brown for (i = 0; i < nr; i++) { 13798068ee9dSPierre Jolivet s->m[i] = s->m[0] + i * nc; 1380c8883902SJed Brown for (j = 0; j < nc; j++) { 13813536838dSStefano Zampini s->m[i][j] = a ? a[i * nc + j] : NULL; 13823536838dSStefano Zampini PetscCall(PetscObjectReference((PetscObject)s->m[i][j])); 1383d8588912SDave May } 1384d8588912SDave May } 13859566063dSJacob Faibussowitsch PetscCall(MatGetVecType(A, &vtype)); 13869566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(vtype, VECSTANDARD, &isstd)); 138788ffe2e8SJose E. Roman if (isstd) { 138888ffe2e8SJose E. Roman /* check if all blocks have the same vectype */ 138988ffe2e8SJose E. Roman vtype = NULL; 139088ffe2e8SJose E. Roman for (i = 0; i < nr; i++) { 139188ffe2e8SJose E. Roman for (j = 0; j < nc; j++) { 13923536838dSStefano Zampini if (s->m[i][j]) { 139388ffe2e8SJose E. Roman if (!vtype) { /* first visited block */ 13943536838dSStefano Zampini PetscCall(MatGetVecType(s->m[i][j], &vtype)); 139588ffe2e8SJose E. Roman sametype = PETSC_TRUE; 139688ffe2e8SJose E. Roman } else if (sametype) { 13973536838dSStefano Zampini PetscCall(MatGetVecType(s->m[i][j], &type)); 13989566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(vtype, type, &sametype)); 139988ffe2e8SJose E. Roman } 140088ffe2e8SJose E. Roman } 140188ffe2e8SJose E. Roman } 140288ffe2e8SJose E. Roman } 140388ffe2e8SJose E. Roman if (sametype) { /* propagate vectype */ 14049566063dSJacob Faibussowitsch PetscCall(MatSetVecType(A, vtype)); 140588ffe2e8SJose E. Roman } 140688ffe2e8SJose E. Roman } 1407d8588912SDave May 14089566063dSJacob Faibussowitsch PetscCall(MatSetUp_NestIS_Private(A, nr, is_row, nc, is_col)); 1409d8588912SDave May 14109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nr, &s->row_len)); 14119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nc, &s->col_len)); 1412c8883902SJed Brown for (i = 0; i < nr; i++) s->row_len[i] = -1; 1413c8883902SJed Brown for (j = 0; j < nc; j++) s->col_len[j] = -1; 1414d8588912SDave May 14159566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nr * nc, &s->nnzstate)); 141606a1af2fSStefano Zampini for (i = 0; i < nr; i++) { 141706a1af2fSStefano Zampini for (j = 0; j < nc; j++) { 141848a46eb9SPierre Jolivet if (s->m[i][j]) PetscCall(MatGetNonzeroState(s->m[i][j], &s->nnzstate[i * nc + j])); 141906a1af2fSStefano Zampini } 142006a1af2fSStefano Zampini } 142106a1af2fSStefano Zampini 14229566063dSJacob Faibussowitsch PetscCall(MatNestGetSizes_Private(A, &m, &n, &M, &N)); 1423d8588912SDave May 14249566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetSize(A->rmap, M)); 14259566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetLocalSize(A->rmap, m)); 14269566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetSize(A->cmap, N)); 14279566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetLocalSize(A->cmap, n)); 1428c8883902SJed Brown 14299566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 14309566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 1431c8883902SJed Brown 143206a1af2fSStefano Zampini /* disable operations that are not supported for non-square matrices, 143306a1af2fSStefano Zampini or matrices for which is_row != is_col */ 14349566063dSJacob Faibussowitsch PetscCall(MatHasCongruentLayouts(A, &cong)); 143506a1af2fSStefano Zampini if (cong && nr != nc) cong = PETSC_FALSE; 143606a1af2fSStefano Zampini if (cong) { 143748a46eb9SPierre Jolivet for (i = 0; cong && i < nr; i++) PetscCall(ISEqualUnsorted(s->isglobal.row[i], s->isglobal.col[i], &cong)); 143806a1af2fSStefano Zampini } 143906a1af2fSStefano Zampini if (!cong) { 1440381b8e50SStefano Zampini A->ops->missingdiagonal = NULL; 144106a1af2fSStefano Zampini A->ops->getdiagonal = NULL; 144206a1af2fSStefano Zampini A->ops->shift = NULL; 144306a1af2fSStefano Zampini A->ops->diagonalset = NULL; 144406a1af2fSStefano Zampini } 144506a1af2fSStefano Zampini 14469566063dSJacob Faibussowitsch PetscCall(PetscCalloc2(nr, &s->left, nc, &s->right)); 14479566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 144806a1af2fSStefano Zampini A->nonzerostate++; 14493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1450d8588912SDave May } 1451d8588912SDave May 1452c8883902SJed Brown /*@ 145311a5261eSBarry Smith MatNestSetSubMats - Sets the nested submatrices in a `MATNEST` 1454c8883902SJed Brown 1455c3339decSBarry Smith Collective 1456c8883902SJed Brown 1457d8d19677SJose E. Roman Input Parameters: 145811a5261eSBarry Smith + A - `MATNEST` matrix 1459c8883902SJed Brown . nr - number of nested row blocks 14602ef1f0ffSBarry Smith . is_row - index sets for each nested row block, or `NULL` to make contiguous 1461c8883902SJed Brown . nc - number of nested column blocks 14622ef1f0ffSBarry Smith . is_col - index sets for each nested column block, or `NULL` to make contiguous 14633536838dSStefano Zampini - a - array of nr*nc submatrices, or `NULL` 14642ef1f0ffSBarry Smith 14652ef1f0ffSBarry Smith Level: advanced 1466c8883902SJed Brown 1467e9d3347aSJose E. Roman Notes: 14683536838dSStefano Zampini This always resets any block matrix information previously set. 1469d8b4a066SPierre Jolivet Pass `NULL` in the corresponding entry of `a` for an empty block. 147006a1af2fSStefano Zampini 1471e9d3347aSJose E. Roman In both C and Fortran, `a` must be a row-major order array containing the matrices. See 1472e9d3347aSJose E. Roman `MatCreateNest()` for an example. 1473e9d3347aSJose E. Roman 14741cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatCreateNest()`, `MatNestSetSubMat()`, `MatNestGetSubMat()`, `MatNestGetSubMats()` 1475c8883902SJed Brown @*/ 1476d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestSetSubMats(Mat A, PetscInt nr, const IS is_row[], PetscInt nc, const IS is_col[], const Mat a[]) 1477d71ae5a4SJacob Faibussowitsch { 1478c8883902SJed Brown PetscFunctionBegin; 1479c8883902SJed Brown PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 14803536838dSStefano Zampini PetscValidLogicalCollectiveInt(A, nr, 2); 148108401ef6SPierre Jolivet PetscCheck(nr >= 0, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Number of rows cannot be negative"); 1482c8883902SJed Brown if (nr && is_row) { 14834f572ea9SToby Isaac PetscAssertPointer(is_row, 3); 14843536838dSStefano Zampini for (PetscInt i = 0; i < nr; i++) PetscValidHeaderSpecific(is_row[i], IS_CLASSID, 3); 1485c8883902SJed Brown } 14863536838dSStefano Zampini PetscValidLogicalCollectiveInt(A, nc, 4); 148708401ef6SPierre Jolivet PetscCheck(nc >= 0, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Number of columns cannot be negative"); 14881664e352SJed Brown if (nc && is_col) { 14894f572ea9SToby Isaac PetscAssertPointer(is_col, 5); 14903536838dSStefano Zampini for (PetscInt i = 0; i < nc; i++) PetscValidHeaderSpecific(is_col[i], IS_CLASSID, 5); 1491c8883902SJed Brown } 14923536838dSStefano Zampini PetscTryMethod(A, "MatNestSetSubMats_C", (Mat, PetscInt, const IS[], PetscInt, const IS[], const Mat[]), (A, nr, is_row, nc, is_col, a)); 14933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1494c8883902SJed Brown } 1495d8588912SDave May 1496d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestCreateAggregateL2G_Private(Mat A, PetscInt n, const IS islocal[], const IS isglobal[], PetscBool colflg, ISLocalToGlobalMapping *ltog) 1497d71ae5a4SJacob Faibussowitsch { 149877019fcaSJed Brown PetscBool flg; 149977019fcaSJed Brown PetscInt i, j, m, mi, *ix; 150077019fcaSJed Brown 150177019fcaSJed Brown PetscFunctionBegin; 1502aea6d515SStefano Zampini *ltog = NULL; 150377019fcaSJed Brown for (i = 0, m = 0, flg = PETSC_FALSE; i < n; i++) { 150477019fcaSJed Brown if (islocal[i]) { 15059566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(islocal[i], &mi)); 150677019fcaSJed Brown flg = PETSC_TRUE; /* We found a non-trivial entry */ 150777019fcaSJed Brown } else { 15089566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isglobal[i], &mi)); 150977019fcaSJed Brown } 151077019fcaSJed Brown m += mi; 151177019fcaSJed Brown } 15123ba16761SJacob Faibussowitsch if (!flg) PetscFunctionReturn(PETSC_SUCCESS); 1513aea6d515SStefano Zampini 15149566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &ix)); 1515165cd838SBarry Smith for (i = 0, m = 0; i < n; i++) { 15160298fd71SBarry Smith ISLocalToGlobalMapping smap = NULL; 1517e108cb99SStefano Zampini Mat sub = NULL; 1518f6d38dbbSStefano Zampini PetscSF sf; 1519f6d38dbbSStefano Zampini PetscLayout map; 1520aea6d515SStefano Zampini const PetscInt *ix2; 152177019fcaSJed Brown 1522165cd838SBarry Smith if (!colflg) { 15239566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatRow(A, i, &sub)); 152477019fcaSJed Brown } else { 15259566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatCol(A, i, &sub)); 152677019fcaSJed Brown } 1527191fd14bSBarry Smith if (sub) { 1528191fd14bSBarry Smith if (!colflg) { 15299566063dSJacob Faibussowitsch PetscCall(MatGetLocalToGlobalMapping(sub, &smap, NULL)); 1530191fd14bSBarry Smith } else { 15319566063dSJacob Faibussowitsch PetscCall(MatGetLocalToGlobalMapping(sub, NULL, &smap)); 1532191fd14bSBarry Smith } 1533191fd14bSBarry Smith } 153477019fcaSJed Brown /* 153577019fcaSJed Brown Now we need to extract the monolithic global indices that correspond to the given split global indices. 153677019fcaSJed Brown In many/most cases, we only want MatGetLocalSubMatrix() to work, in which case we only need to know the size of the local spaces. 153777019fcaSJed Brown */ 15389566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isglobal[i], &ix2)); 1539aea6d515SStefano Zampini if (islocal[i]) { 1540aea6d515SStefano Zampini PetscInt *ilocal, *iremote; 1541aea6d515SStefano Zampini PetscInt mil, nleaves; 1542aea6d515SStefano Zampini 15439566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(islocal[i], &mi)); 154428b400f6SJacob Faibussowitsch PetscCheck(smap, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Missing local to global map"); 1545aea6d515SStefano Zampini for (j = 0; j < mi; j++) ix[m + j] = j; 15469566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingApply(smap, mi, ix + m, ix + m)); 1547aea6d515SStefano Zampini 1548aea6d515SStefano Zampini /* PetscSFSetGraphLayout does not like negative indices */ 15499566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(mi, &ilocal, mi, &iremote)); 1550aea6d515SStefano Zampini for (j = 0, nleaves = 0; j < mi; j++) { 1551aea6d515SStefano Zampini if (ix[m + j] < 0) continue; 1552aea6d515SStefano Zampini ilocal[nleaves] = j; 1553aea6d515SStefano Zampini iremote[nleaves] = ix[m + j]; 1554aea6d515SStefano Zampini nleaves++; 1555aea6d515SStefano Zampini } 15569566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isglobal[i], &mil)); 15579566063dSJacob Faibussowitsch PetscCall(PetscSFCreate(PetscObjectComm((PetscObject)A), &sf)); 15589566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreate(PetscObjectComm((PetscObject)A), &map)); 15599566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetLocalSize(map, mil)); 15609566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(map)); 15619566063dSJacob Faibussowitsch PetscCall(PetscSFSetGraphLayout(sf, map, nleaves, ilocal, PETSC_USE_POINTER, iremote)); 15629566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&map)); 15639566063dSJacob Faibussowitsch PetscCall(PetscSFBcastBegin(sf, MPIU_INT, ix2, ix + m, MPI_REPLACE)); 15649566063dSJacob Faibussowitsch PetscCall(PetscSFBcastEnd(sf, MPIU_INT, ix2, ix + m, MPI_REPLACE)); 15659566063dSJacob Faibussowitsch PetscCall(PetscSFDestroy(&sf)); 15669566063dSJacob Faibussowitsch PetscCall(PetscFree2(ilocal, iremote)); 1567aea6d515SStefano Zampini } else { 15689566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isglobal[i], &mi)); 1569aea6d515SStefano Zampini for (j = 0; j < mi; j++) ix[m + j] = ix2[i]; 1570aea6d515SStefano Zampini } 15719566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isglobal[i], &ix2)); 157277019fcaSJed Brown m += mi; 157377019fcaSJed Brown } 15749566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PetscObjectComm((PetscObject)A), 1, m, ix, PETSC_OWN_POINTER, ltog)); 15753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 157677019fcaSJed Brown } 157777019fcaSJed Brown 1578d8588912SDave May /* If an IS was provided, there is nothing Nest needs to do, otherwise Nest will build a strided IS */ 1579d8588912SDave May /* 1580d8588912SDave May nprocessors = NP 1581d8588912SDave May Nest x^T = ((g_0,g_1,...g_nprocs-1), (h_0,h_1,...h_NP-1)) 1582d8588912SDave May proc 0: => (g_0,h_0,) 1583d8588912SDave May proc 1: => (g_1,h_1,) 1584d8588912SDave May ... 1585d8588912SDave May proc nprocs-1: => (g_NP-1,h_NP-1,) 1586d8588912SDave May 1587d8588912SDave May proc 0: proc 1: proc nprocs-1: 1588d8588912SDave May is[0] = (0,1,2,...,nlocal(g_0)-1) (0,1,...,nlocal(g_1)-1) (0,1,...,nlocal(g_NP-1)) 1589d8588912SDave May 1590d8588912SDave May proc 0: 1591d8588912SDave May is[1] = (nlocal(g_0),nlocal(g_0)+1,...,nlocal(g_0)+nlocal(h_0)-1) 1592d8588912SDave May proc 1: 1593d8588912SDave May is[1] = (nlocal(g_1),nlocal(g_1)+1,...,nlocal(g_1)+nlocal(h_1)-1) 1594d8588912SDave May 1595d8588912SDave May proc NP-1: 1596d8588912SDave May is[1] = (nlocal(g_NP-1),nlocal(g_NP-1)+1,...,nlocal(g_NP-1)+nlocal(h_NP-1)-1) 1597d8588912SDave May */ 1598d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetUp_NestIS_Private(Mat A, PetscInt nr, const IS is_row[], PetscInt nc, const IS is_col[]) 1599d71ae5a4SJacob Faibussowitsch { 1600e2d7f03fSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 16018188e55aSJed Brown PetscInt i, j, offset, n, nsum, bs; 16020298fd71SBarry Smith Mat sub = NULL; 1603d8588912SDave May 1604d8588912SDave May PetscFunctionBegin; 16059566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nr, &vs->isglobal.row)); 16069566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nc, &vs->isglobal.col)); 1607d8588912SDave May if (is_row) { /* valid IS is passed in */ 1608a5b23f4aSJose E. Roman /* refs on is[] are incremented */ 1609e2d7f03fSJed Brown for (i = 0; i < vs->nr; i++) { 16109566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)is_row[i])); 161126fbe8dcSKarl Rupp 1612e2d7f03fSJed Brown vs->isglobal.row[i] = is_row[i]; 1613d8588912SDave May } 16142ae74bdbSJed Brown } else { /* Create the ISs by inspecting sizes of a submatrix in each row */ 16158188e55aSJed Brown nsum = 0; 16168188e55aSJed Brown for (i = 0; i < vs->nr; i++) { /* Add up the local sizes to compute the aggregate offset */ 16179566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatRow(A, i, &sub)); 161828b400f6SJacob Faibussowitsch PetscCheck(sub, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "No nonzero submatrix in row %" PetscInt_FMT, i); 16199566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(sub, &n, NULL)); 162008401ef6SPierre Jolivet PetscCheck(n >= 0, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Sizes have not yet been set for submatrix"); 16218188e55aSJed Brown nsum += n; 16228188e55aSJed Brown } 16239566063dSJacob Faibussowitsch PetscCallMPI(MPI_Scan(&nsum, &offset, 1, MPIU_INT, MPI_SUM, PetscObjectComm((PetscObject)A))); 162430bc264bSJed Brown offset -= nsum; 1625e2d7f03fSJed Brown for (i = 0; i < vs->nr; i++) { 16269566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatRow(A, i, &sub)); 16279566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(sub, &n, NULL)); 16289566063dSJacob Faibussowitsch PetscCall(MatGetBlockSizes(sub, &bs, NULL)); 16299566063dSJacob Faibussowitsch PetscCall(ISCreateStride(PetscObjectComm((PetscObject)sub), n, offset, 1, &vs->isglobal.row[i])); 16309566063dSJacob Faibussowitsch PetscCall(ISSetBlockSize(vs->isglobal.row[i], bs)); 16312ae74bdbSJed Brown offset += n; 1632d8588912SDave May } 1633d8588912SDave May } 1634d8588912SDave May 1635d8588912SDave May if (is_col) { /* valid IS is passed in */ 1636a5b23f4aSJose E. Roman /* refs on is[] are incremented */ 1637e2d7f03fSJed Brown for (j = 0; j < vs->nc; j++) { 16389566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)is_col[j])); 163926fbe8dcSKarl Rupp 1640e2d7f03fSJed Brown vs->isglobal.col[j] = is_col[j]; 1641d8588912SDave May } 16422ae74bdbSJed Brown } else { /* Create the ISs by inspecting sizes of a submatrix in each column */ 16432ae74bdbSJed Brown offset = A->cmap->rstart; 16448188e55aSJed Brown nsum = 0; 16458188e55aSJed Brown for (j = 0; j < vs->nc; j++) { 16469566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatCol(A, j, &sub)); 164728b400f6SJacob Faibussowitsch PetscCheck(sub, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "No nonzero submatrix in column %" PetscInt_FMT, i); 16489566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(sub, NULL, &n)); 164908401ef6SPierre Jolivet PetscCheck(n >= 0, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Sizes have not yet been set for submatrix"); 16508188e55aSJed Brown nsum += n; 16518188e55aSJed Brown } 16529566063dSJacob Faibussowitsch PetscCallMPI(MPI_Scan(&nsum, &offset, 1, MPIU_INT, MPI_SUM, PetscObjectComm((PetscObject)A))); 165330bc264bSJed Brown offset -= nsum; 1654e2d7f03fSJed Brown for (j = 0; j < vs->nc; j++) { 16559566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatCol(A, j, &sub)); 16569566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(sub, NULL, &n)); 16579566063dSJacob Faibussowitsch PetscCall(MatGetBlockSizes(sub, NULL, &bs)); 16589566063dSJacob Faibussowitsch PetscCall(ISCreateStride(PetscObjectComm((PetscObject)sub), n, offset, 1, &vs->isglobal.col[j])); 16599566063dSJacob Faibussowitsch PetscCall(ISSetBlockSize(vs->isglobal.col[j], bs)); 16602ae74bdbSJed Brown offset += n; 1661d8588912SDave May } 1662d8588912SDave May } 1663e2d7f03fSJed Brown 1664e2d7f03fSJed Brown /* Set up the local ISs */ 16659566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(vs->nr, &vs->islocal.row)); 16669566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(vs->nc, &vs->islocal.col)); 1667e2d7f03fSJed Brown for (i = 0, offset = 0; i < vs->nr; i++) { 1668e2d7f03fSJed Brown IS isloc; 16690298fd71SBarry Smith ISLocalToGlobalMapping rmap = NULL; 1670e2d7f03fSJed Brown PetscInt nlocal, bs; 16719566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatRow(A, i, &sub)); 16729566063dSJacob Faibussowitsch if (sub) PetscCall(MatGetLocalToGlobalMapping(sub, &rmap, NULL)); 1673207556f9SJed Brown if (rmap) { 16749566063dSJacob Faibussowitsch PetscCall(MatGetBlockSizes(sub, &bs, NULL)); 16759566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingGetSize(rmap, &nlocal)); 16769566063dSJacob Faibussowitsch PetscCall(ISCreateStride(PETSC_COMM_SELF, nlocal, offset, 1, &isloc)); 16779566063dSJacob Faibussowitsch PetscCall(ISSetBlockSize(isloc, bs)); 1678207556f9SJed Brown } else { 1679207556f9SJed Brown nlocal = 0; 16800298fd71SBarry Smith isloc = NULL; 1681207556f9SJed Brown } 1682e2d7f03fSJed Brown vs->islocal.row[i] = isloc; 1683e2d7f03fSJed Brown offset += nlocal; 1684e2d7f03fSJed Brown } 16858188e55aSJed Brown for (i = 0, offset = 0; i < vs->nc; i++) { 1686e2d7f03fSJed Brown IS isloc; 16870298fd71SBarry Smith ISLocalToGlobalMapping cmap = NULL; 1688e2d7f03fSJed Brown PetscInt nlocal, bs; 16899566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatCol(A, i, &sub)); 16909566063dSJacob Faibussowitsch if (sub) PetscCall(MatGetLocalToGlobalMapping(sub, NULL, &cmap)); 1691207556f9SJed Brown if (cmap) { 16929566063dSJacob Faibussowitsch PetscCall(MatGetBlockSizes(sub, NULL, &bs)); 16939566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingGetSize(cmap, &nlocal)); 16949566063dSJacob Faibussowitsch PetscCall(ISCreateStride(PETSC_COMM_SELF, nlocal, offset, 1, &isloc)); 16959566063dSJacob Faibussowitsch PetscCall(ISSetBlockSize(isloc, bs)); 1696207556f9SJed Brown } else { 1697207556f9SJed Brown nlocal = 0; 16980298fd71SBarry Smith isloc = NULL; 1699207556f9SJed Brown } 1700e2d7f03fSJed Brown vs->islocal.col[i] = isloc; 1701e2d7f03fSJed Brown offset += nlocal; 1702e2d7f03fSJed Brown } 17030189643fSJed Brown 170477019fcaSJed Brown /* Set up the aggregate ISLocalToGlobalMapping */ 170577019fcaSJed Brown { 170645b6f7e9SBarry Smith ISLocalToGlobalMapping rmap, cmap; 17079566063dSJacob Faibussowitsch PetscCall(MatNestCreateAggregateL2G_Private(A, vs->nr, vs->islocal.row, vs->isglobal.row, PETSC_FALSE, &rmap)); 17089566063dSJacob Faibussowitsch PetscCall(MatNestCreateAggregateL2G_Private(A, vs->nc, vs->islocal.col, vs->isglobal.col, PETSC_TRUE, &cmap)); 17099566063dSJacob Faibussowitsch if (rmap && cmap) PetscCall(MatSetLocalToGlobalMapping(A, rmap, cmap)); 17109566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&rmap)); 17119566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&cmap)); 171277019fcaSJed Brown } 171377019fcaSJed Brown 171476bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 17150189643fSJed Brown for (i = 0; i < vs->nr; i++) { 17160189643fSJed Brown for (j = 0; j < vs->nc; j++) { 17170189643fSJed Brown PetscInt m, n, M, N, mi, ni, Mi, Ni; 17180189643fSJed Brown Mat B = vs->m[i][j]; 17190189643fSJed Brown if (!B) continue; 17209566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &M, &N)); 17219566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(B, &m, &n)); 17229566063dSJacob Faibussowitsch PetscCall(ISGetSize(vs->isglobal.row[i], &Mi)); 17239566063dSJacob Faibussowitsch PetscCall(ISGetSize(vs->isglobal.col[j], &Ni)); 17249566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(vs->isglobal.row[i], &mi)); 17259566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(vs->isglobal.col[j], &ni)); 1726aed4548fSBarry Smith PetscCheck(M == Mi && N == Ni, PetscObjectComm((PetscObject)sub), PETSC_ERR_ARG_INCOMP, "Global sizes (%" PetscInt_FMT ",%" PetscInt_FMT ") of nested submatrix (%" PetscInt_FMT ",%" PetscInt_FMT ") do not agree with space defined by index sets (%" PetscInt_FMT ",%" PetscInt_FMT ")", M, N, i, j, Mi, Ni); 1727aed4548fSBarry Smith PetscCheck(m == mi && n == ni, PetscObjectComm((PetscObject)sub), PETSC_ERR_ARG_INCOMP, "Local sizes (%" PetscInt_FMT ",%" PetscInt_FMT ") of nested submatrix (%" PetscInt_FMT ",%" PetscInt_FMT ") do not agree with space defined by index sets (%" PetscInt_FMT ",%" PetscInt_FMT ")", m, n, i, j, mi, ni); 17280189643fSJed Brown } 17290189643fSJed Brown } 173076bd3646SJed Brown } 1731a061e289SJed Brown 1732a061e289SJed Brown /* Set A->assembled if all non-null blocks are currently assembled */ 1733a061e289SJed Brown for (i = 0; i < vs->nr; i++) { 1734a061e289SJed Brown for (j = 0; j < vs->nc; j++) { 17353ba16761SJacob Faibussowitsch if (vs->m[i][j] && !vs->m[i][j]->assembled) PetscFunctionReturn(PETSC_SUCCESS); 1736a061e289SJed Brown } 1737a061e289SJed Brown } 1738a061e289SJed Brown A->assembled = PETSC_TRUE; 17393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1740d8588912SDave May } 1741d8588912SDave May 174245c38901SJed Brown /*@C 174311a5261eSBarry Smith MatCreateNest - Creates a new `MATNEST` matrix containing several nested submatrices, each stored separately 1744659c6bb0SJed Brown 174511a5261eSBarry Smith Collective 1746659c6bb0SJed Brown 1747d8d19677SJose E. Roman Input Parameters: 174811a5261eSBarry Smith + comm - Communicator for the new `MATNEST` 1749659c6bb0SJed Brown . nr - number of nested row blocks 17502ef1f0ffSBarry Smith . is_row - index sets for each nested row block, or `NULL` to make contiguous 1751659c6bb0SJed Brown . nc - number of nested column blocks 17522ef1f0ffSBarry Smith . is_col - index sets for each nested column block, or `NULL` to make contiguous 1753e9d3347aSJose E. Roman - a - array of nr*nc submatrices, empty submatrices can be passed using `NULL` 1754659c6bb0SJed Brown 1755659c6bb0SJed Brown Output Parameter: 1756659c6bb0SJed Brown . B - new matrix 1757659c6bb0SJed Brown 1758e9d3347aSJose E. Roman Note: 1759e9d3347aSJose E. Roman In both C and Fortran, `a` must be a row-major order array holding references to the matrices. 1760e9d3347aSJose E. Roman For instance, to represent the matrix 1761e9d3347aSJose E. Roman $\begin{bmatrix} A_{11} & A_{12} \\ A_{21} & A_{22}\end{bmatrix}$ 1762e9d3347aSJose E. Roman one should use `Mat a[4]={A11,A12,A21,A22}`. 1763e9d3347aSJose E. Roman 1764659c6bb0SJed Brown Level: advanced 1765659c6bb0SJed Brown 17661cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatCreate()`, `VecCreateNest()`, `DMCreateMatrix()`, `MatNestSetSubMat()`, 1767db781477SPatrick Sanan `MatNestGetSubMat()`, `MatNestGetLocalISs()`, `MatNestGetSize()`, 1768db781477SPatrick Sanan `MatNestGetISs()`, `MatNestSetSubMats()`, `MatNestGetSubMats()` 1769659c6bb0SJed Brown @*/ 1770d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateNest(MPI_Comm comm, PetscInt nr, const IS is_row[], PetscInt nc, const IS is_col[], const Mat a[], Mat *B) 1771d71ae5a4SJacob Faibussowitsch { 1772d8588912SDave May PetscFunctionBegin; 17733536838dSStefano Zampini PetscCall(MatCreate(comm, B)); 17743536838dSStefano Zampini PetscCall(MatSetType(*B, MATNEST)); 17753536838dSStefano Zampini (*B)->preallocated = PETSC_TRUE; 17763536838dSStefano Zampini PetscCall(MatNestSetSubMats(*B, nr, is_row, nc, is_col, a)); 17773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1778d8588912SDave May } 1779659c6bb0SJed Brown 178066976f2fSJacob Faibussowitsch static PetscErrorCode MatConvert_Nest_SeqAIJ_fast(Mat A, MatType newtype, MatReuse reuse, Mat *newmat) 1781d71ae5a4SJacob Faibussowitsch { 1782b68353e5Sstefano_zampini Mat_Nest *nest = (Mat_Nest *)A->data; 178323875855Sstefano_zampini Mat *trans; 1784b68353e5Sstefano_zampini PetscScalar **avv; 1785b68353e5Sstefano_zampini PetscScalar *vv; 1786b68353e5Sstefano_zampini PetscInt **aii, **ajj; 1787b68353e5Sstefano_zampini PetscInt *ii, *jj, *ci; 1788b68353e5Sstefano_zampini PetscInt nr, nc, nnz, i, j; 1789b68353e5Sstefano_zampini PetscBool done; 1790b68353e5Sstefano_zampini 1791b68353e5Sstefano_zampini PetscFunctionBegin; 17929566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &nr, &nc)); 1793b68353e5Sstefano_zampini if (reuse == MAT_REUSE_MATRIX) { 1794b68353e5Sstefano_zampini PetscInt rnr; 1795b68353e5Sstefano_zampini 17969566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(*newmat, 0, PETSC_FALSE, PETSC_FALSE, &rnr, (const PetscInt **)&ii, (const PetscInt **)&jj, &done)); 179728b400f6SJacob Faibussowitsch PetscCheck(done, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "MatGetRowIJ"); 179808401ef6SPierre Jolivet PetscCheck(rnr == nr, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "Cannot reuse matrix, wrong number of rows"); 17999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*newmat, &vv)); 1800b68353e5Sstefano_zampini } 1801b68353e5Sstefano_zampini /* extract CSR for nested SeqAIJ matrices */ 1802b68353e5Sstefano_zampini nnz = 0; 18039566063dSJacob Faibussowitsch PetscCall(PetscCalloc4(nest->nr * nest->nc, &aii, nest->nr * nest->nc, &ajj, nest->nr * nest->nc, &avv, nest->nr * nest->nc, &trans)); 1804b68353e5Sstefano_zampini for (i = 0; i < nest->nr; ++i) { 1805b68353e5Sstefano_zampini for (j = 0; j < nest->nc; ++j) { 1806b68353e5Sstefano_zampini Mat B = nest->m[i][j]; 1807b68353e5Sstefano_zampini if (B) { 1808b68353e5Sstefano_zampini PetscScalar *naa; 1809b68353e5Sstefano_zampini PetscInt *nii, *njj, nnr; 181023875855Sstefano_zampini PetscBool istrans; 1811b68353e5Sstefano_zampini 1812013e2dc7SBarry Smith PetscCall(PetscObjectTypeCompare((PetscObject)B, MATTRANSPOSEVIRTUAL, &istrans)); 181323875855Sstefano_zampini if (istrans) { 181423875855Sstefano_zampini Mat Bt; 181523875855Sstefano_zampini 18169566063dSJacob Faibussowitsch PetscCall(MatTransposeGetMat(B, &Bt)); 18179566063dSJacob Faibussowitsch PetscCall(MatTranspose(Bt, MAT_INITIAL_MATRIX, &trans[i * nest->nc + j])); 181823875855Sstefano_zampini B = trans[i * nest->nc + j]; 1819013e2dc7SBarry Smith } else { 1820013e2dc7SBarry Smith PetscCall(PetscObjectTypeCompare((PetscObject)B, MATHERMITIANTRANSPOSEVIRTUAL, &istrans)); 1821013e2dc7SBarry Smith if (istrans) { 1822013e2dc7SBarry Smith Mat Bt; 1823013e2dc7SBarry Smith 1824013e2dc7SBarry Smith PetscCall(MatHermitianTransposeGetMat(B, &Bt)); 1825013e2dc7SBarry Smith PetscCall(MatHermitianTranspose(Bt, MAT_INITIAL_MATRIX, &trans[i * nest->nc + j])); 1826013e2dc7SBarry Smith B = trans[i * nest->nc + j]; 1827013e2dc7SBarry Smith } 182823875855Sstefano_zampini } 18299566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(B, 0, PETSC_FALSE, PETSC_FALSE, &nnr, (const PetscInt **)&nii, (const PetscInt **)&njj, &done)); 183028b400f6SJacob Faibussowitsch PetscCheck(done, PetscObjectComm((PetscObject)B), PETSC_ERR_PLIB, "MatGetRowIJ"); 18319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(B, &naa)); 1832b68353e5Sstefano_zampini nnz += nii[nnr]; 1833b68353e5Sstefano_zampini 1834b68353e5Sstefano_zampini aii[i * nest->nc + j] = nii; 1835b68353e5Sstefano_zampini ajj[i * nest->nc + j] = njj; 1836b68353e5Sstefano_zampini avv[i * nest->nc + j] = naa; 1837b68353e5Sstefano_zampini } 1838b68353e5Sstefano_zampini } 1839b68353e5Sstefano_zampini } 1840b68353e5Sstefano_zampini if (reuse != MAT_REUSE_MATRIX) { 18419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nr + 1, &ii)); 18429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &jj)); 18439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &vv)); 1844b68353e5Sstefano_zampini } else { 184508401ef6SPierre Jolivet PetscCheck(nnz == ii[nr], PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "Cannot reuse matrix, wrong number of nonzeros"); 1846b68353e5Sstefano_zampini } 1847b68353e5Sstefano_zampini 1848b68353e5Sstefano_zampini /* new row pointer */ 18499566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ii, nr + 1)); 1850b68353e5Sstefano_zampini for (i = 0; i < nest->nr; ++i) { 1851b68353e5Sstefano_zampini PetscInt ncr, rst; 1852b68353e5Sstefano_zampini 18539566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(nest->isglobal.row[i], &rst, NULL)); 18549566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(nest->isglobal.row[i], &ncr)); 1855b68353e5Sstefano_zampini for (j = 0; j < nest->nc; ++j) { 1856b68353e5Sstefano_zampini if (aii[i * nest->nc + j]) { 1857b68353e5Sstefano_zampini PetscInt *nii = aii[i * nest->nc + j]; 1858b68353e5Sstefano_zampini PetscInt ir; 1859b68353e5Sstefano_zampini 1860b68353e5Sstefano_zampini for (ir = rst; ir < ncr + rst; ++ir) { 1861b68353e5Sstefano_zampini ii[ir + 1] += nii[1] - nii[0]; 1862b68353e5Sstefano_zampini nii++; 1863b68353e5Sstefano_zampini } 1864b68353e5Sstefano_zampini } 1865b68353e5Sstefano_zampini } 1866b68353e5Sstefano_zampini } 1867b68353e5Sstefano_zampini for (i = 0; i < nr; i++) ii[i + 1] += ii[i]; 1868b68353e5Sstefano_zampini 1869b68353e5Sstefano_zampini /* construct CSR for the new matrix */ 18709566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nr, &ci)); 1871b68353e5Sstefano_zampini for (i = 0; i < nest->nr; ++i) { 1872b68353e5Sstefano_zampini PetscInt ncr, rst; 1873b68353e5Sstefano_zampini 18749566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(nest->isglobal.row[i], &rst, NULL)); 18759566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(nest->isglobal.row[i], &ncr)); 1876b68353e5Sstefano_zampini for (j = 0; j < nest->nc; ++j) { 1877b68353e5Sstefano_zampini if (aii[i * nest->nc + j]) { 1878b68353e5Sstefano_zampini PetscScalar *nvv = avv[i * nest->nc + j]; 1879b68353e5Sstefano_zampini PetscInt *nii = aii[i * nest->nc + j]; 1880b68353e5Sstefano_zampini PetscInt *njj = ajj[i * nest->nc + j]; 1881b68353e5Sstefano_zampini PetscInt ir, cst; 1882b68353e5Sstefano_zampini 18839566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(nest->isglobal.col[j], &cst, NULL)); 1884b68353e5Sstefano_zampini for (ir = rst; ir < ncr + rst; ++ir) { 1885b68353e5Sstefano_zampini PetscInt ij, rsize = nii[1] - nii[0], ist = ii[ir] + ci[ir]; 1886b68353e5Sstefano_zampini 1887b68353e5Sstefano_zampini for (ij = 0; ij < rsize; ij++) { 1888b68353e5Sstefano_zampini jj[ist + ij] = *njj + cst; 1889b68353e5Sstefano_zampini vv[ist + ij] = *nvv; 1890b68353e5Sstefano_zampini njj++; 1891b68353e5Sstefano_zampini nvv++; 1892b68353e5Sstefano_zampini } 1893b68353e5Sstefano_zampini ci[ir] += rsize; 1894b68353e5Sstefano_zampini nii++; 1895b68353e5Sstefano_zampini } 1896b68353e5Sstefano_zampini } 1897b68353e5Sstefano_zampini } 1898b68353e5Sstefano_zampini } 18999566063dSJacob Faibussowitsch PetscCall(PetscFree(ci)); 1900b68353e5Sstefano_zampini 1901b68353e5Sstefano_zampini /* restore info */ 1902b68353e5Sstefano_zampini for (i = 0; i < nest->nr; ++i) { 1903b68353e5Sstefano_zampini for (j = 0; j < nest->nc; ++j) { 1904b68353e5Sstefano_zampini Mat B = nest->m[i][j]; 1905b68353e5Sstefano_zampini if (B) { 1906b68353e5Sstefano_zampini PetscInt nnr = 0, k = i * nest->nc + j; 190723875855Sstefano_zampini 190823875855Sstefano_zampini B = (trans[k] ? trans[k] : B); 19099566063dSJacob Faibussowitsch PetscCall(MatRestoreRowIJ(B, 0, PETSC_FALSE, PETSC_FALSE, &nnr, (const PetscInt **)&aii[k], (const PetscInt **)&ajj[k], &done)); 191028b400f6SJacob Faibussowitsch PetscCheck(done, PetscObjectComm((PetscObject)B), PETSC_ERR_PLIB, "MatRestoreRowIJ"); 19119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(B, &avv[k])); 19129566063dSJacob Faibussowitsch PetscCall(MatDestroy(&trans[k])); 1913b68353e5Sstefano_zampini } 1914b68353e5Sstefano_zampini } 1915b68353e5Sstefano_zampini } 19169566063dSJacob Faibussowitsch PetscCall(PetscFree4(aii, ajj, avv, trans)); 1917b68353e5Sstefano_zampini 1918b68353e5Sstefano_zampini /* finalize newmat */ 1919b68353e5Sstefano_zampini if (reuse == MAT_INITIAL_MATRIX) { 19209566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A), nr, nc, ii, jj, vv, newmat)); 1921b68353e5Sstefano_zampini } else if (reuse == MAT_INPLACE_MATRIX) { 1922b68353e5Sstefano_zampini Mat B; 1923b68353e5Sstefano_zampini 19249566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A), nr, nc, ii, jj, vv, &B)); 19259566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A, &B)); 1926b68353e5Sstefano_zampini } 19279566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*newmat, MAT_FINAL_ASSEMBLY)); 19289566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*newmat, MAT_FINAL_ASSEMBLY)); 1929b68353e5Sstefano_zampini { 1930b68353e5Sstefano_zampini Mat_SeqAIJ *a = (Mat_SeqAIJ *)((*newmat)->data); 1931b68353e5Sstefano_zampini a->free_a = PETSC_TRUE; 1932b68353e5Sstefano_zampini a->free_ij = PETSC_TRUE; 1933b68353e5Sstefano_zampini } 19343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1935b68353e5Sstefano_zampini } 1936b68353e5Sstefano_zampini 1937d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatAXPY_Dense_Nest(Mat Y, PetscScalar a, Mat X) 1938d71ae5a4SJacob Faibussowitsch { 1939be705e3aSPierre Jolivet Mat_Nest *nest = (Mat_Nest *)X->data; 1940be705e3aSPierre Jolivet PetscInt i, j, k, rstart; 1941be705e3aSPierre Jolivet PetscBool flg; 1942be705e3aSPierre Jolivet 1943be705e3aSPierre Jolivet PetscFunctionBegin; 1944be705e3aSPierre Jolivet /* Fill by row */ 1945be705e3aSPierre Jolivet for (j = 0; j < nest->nc; ++j) { 1946be705e3aSPierre Jolivet /* Using global column indices and ISAllGather() is not scalable. */ 1947be705e3aSPierre Jolivet IS bNis; 1948be705e3aSPierre Jolivet PetscInt bN; 1949be705e3aSPierre Jolivet const PetscInt *bNindices; 19509566063dSJacob Faibussowitsch PetscCall(ISAllGather(nest->isglobal.col[j], &bNis)); 19519566063dSJacob Faibussowitsch PetscCall(ISGetSize(bNis, &bN)); 19529566063dSJacob Faibussowitsch PetscCall(ISGetIndices(bNis, &bNindices)); 1953be705e3aSPierre Jolivet for (i = 0; i < nest->nr; ++i) { 1954fd8a7442SPierre Jolivet Mat B = nest->m[i][j], D = NULL; 1955be705e3aSPierre Jolivet PetscInt bm, br; 1956be705e3aSPierre Jolivet const PetscInt *bmindices; 1957be705e3aSPierre Jolivet if (!B) continue; 1958013e2dc7SBarry Smith PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &flg, MATTRANSPOSEVIRTUAL, MATHERMITIANTRANSPOSEVIRTUAL, "")); 1959be705e3aSPierre Jolivet if (flg) { 1960cac4c232SBarry Smith PetscTryMethod(B, "MatTransposeGetMat_C", (Mat, Mat *), (B, &D)); 1961cac4c232SBarry Smith PetscTryMethod(B, "MatHermitianTransposeGetMat_C", (Mat, Mat *), (B, &D)); 19629566063dSJacob Faibussowitsch PetscCall(MatConvert(B, ((PetscObject)D)->type_name, MAT_INITIAL_MATRIX, &D)); 1963be705e3aSPierre Jolivet B = D; 1964be705e3aSPierre Jolivet } 19659566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &flg, MATSEQSBAIJ, MATMPISBAIJ, "")); 1966be705e3aSPierre Jolivet if (flg) { 1967fd8a7442SPierre Jolivet if (D) PetscCall(MatConvert(D, MATBAIJ, MAT_INPLACE_MATRIX, &D)); 1968fd8a7442SPierre Jolivet else PetscCall(MatConvert(B, MATBAIJ, MAT_INITIAL_MATRIX, &D)); 1969be705e3aSPierre Jolivet B = D; 1970be705e3aSPierre Jolivet } 19719566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(nest->isglobal.row[i], &bm)); 19729566063dSJacob Faibussowitsch PetscCall(ISGetIndices(nest->isglobal.row[i], &bmindices)); 19739566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(B, &rstart, NULL)); 1974be705e3aSPierre Jolivet for (br = 0; br < bm; ++br) { 1975be705e3aSPierre Jolivet PetscInt row = bmindices[br], brncols, *cols; 1976be705e3aSPierre Jolivet const PetscInt *brcols; 1977be705e3aSPierre Jolivet const PetscScalar *brcoldata; 1978be705e3aSPierre Jolivet PetscScalar *vals = NULL; 19799566063dSJacob Faibussowitsch PetscCall(MatGetRow(B, br + rstart, &brncols, &brcols, &brcoldata)); 19809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(brncols, &cols)); 1981be705e3aSPierre Jolivet for (k = 0; k < brncols; k++) cols[k] = bNindices[brcols[k]]; 1982be705e3aSPierre Jolivet /* 1983be705e3aSPierre Jolivet Nest blocks are required to be nonoverlapping -- otherwise nest and monolithic index layouts wouldn't match. 1984be705e3aSPierre Jolivet Thus, we could use INSERT_VALUES, but I prefer ADD_VALUES. 1985be705e3aSPierre Jolivet */ 1986be705e3aSPierre Jolivet if (a != 1.0) { 19879566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(brncols, &vals)); 1988be705e3aSPierre Jolivet for (k = 0; k < brncols; k++) vals[k] = a * brcoldata[k]; 19899566063dSJacob Faibussowitsch PetscCall(MatSetValues(Y, 1, &row, brncols, cols, vals, ADD_VALUES)); 19909566063dSJacob Faibussowitsch PetscCall(PetscFree(vals)); 1991be705e3aSPierre Jolivet } else { 19929566063dSJacob Faibussowitsch PetscCall(MatSetValues(Y, 1, &row, brncols, cols, brcoldata, ADD_VALUES)); 1993be705e3aSPierre Jolivet } 19949566063dSJacob Faibussowitsch PetscCall(MatRestoreRow(B, br + rstart, &brncols, &brcols, &brcoldata)); 19959566063dSJacob Faibussowitsch PetscCall(PetscFree(cols)); 1996be705e3aSPierre Jolivet } 1997fd8a7442SPierre Jolivet if (D) PetscCall(MatDestroy(&D)); 19989566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(nest->isglobal.row[i], &bmindices)); 1999be705e3aSPierre Jolivet } 20009566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(bNis, &bNindices)); 20019566063dSJacob Faibussowitsch PetscCall(ISDestroy(&bNis)); 2002be705e3aSPierre Jolivet } 20039566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(Y, MAT_FINAL_ASSEMBLY)); 20049566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(Y, MAT_FINAL_ASSEMBLY)); 20053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2006be705e3aSPierre Jolivet } 2007be705e3aSPierre Jolivet 200866976f2fSJacob Faibussowitsch static PetscErrorCode MatConvert_Nest_AIJ(Mat A, MatType newtype, MatReuse reuse, Mat *newmat) 2009d71ae5a4SJacob Faibussowitsch { 2010629c3df2SDmitry Karpeev Mat_Nest *nest = (Mat_Nest *)A->data; 2011e30678d3SPierre Jolivet PetscInt m, n, M, N, i, j, k, *dnnz, *onnz = NULL, rstart, cstart, cend; 2012b68353e5Sstefano_zampini PetscMPIInt size; 2013629c3df2SDmitry Karpeev Mat C; 2014629c3df2SDmitry Karpeev 2015629c3df2SDmitry Karpeev PetscFunctionBegin; 20169566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A), &size)); 2017b68353e5Sstefano_zampini if (size == 1) { /* look for a special case with SeqAIJ matrices and strided-1, contiguous, blocks */ 2018b68353e5Sstefano_zampini PetscInt nf; 2019b68353e5Sstefano_zampini PetscBool fast; 2020b68353e5Sstefano_zampini 20219566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(newtype, MATAIJ, &fast)); 202248a46eb9SPierre Jolivet if (!fast) PetscCall(PetscStrcmp(newtype, MATSEQAIJ, &fast)); 2023b68353e5Sstefano_zampini for (i = 0; i < nest->nr && fast; ++i) { 2024b68353e5Sstefano_zampini for (j = 0; j < nest->nc && fast; ++j) { 2025b68353e5Sstefano_zampini Mat B = nest->m[i][j]; 2026b68353e5Sstefano_zampini if (B) { 20279566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &fast)); 202823875855Sstefano_zampini if (!fast) { 202923875855Sstefano_zampini PetscBool istrans; 203023875855Sstefano_zampini 2031013e2dc7SBarry Smith PetscCall(PetscObjectTypeCompare((PetscObject)B, MATTRANSPOSEVIRTUAL, &istrans)); 203223875855Sstefano_zampini if (istrans) { 203323875855Sstefano_zampini Mat Bt; 203423875855Sstefano_zampini 20359566063dSJacob Faibussowitsch PetscCall(MatTransposeGetMat(B, &Bt)); 20369566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)Bt, MATSEQAIJ, &fast)); 2037013e2dc7SBarry Smith } else { 2038013e2dc7SBarry Smith PetscCall(PetscObjectTypeCompare((PetscObject)B, MATHERMITIANTRANSPOSEVIRTUAL, &istrans)); 2039013e2dc7SBarry Smith if (istrans) { 2040013e2dc7SBarry Smith Mat Bt; 2041013e2dc7SBarry Smith 2042013e2dc7SBarry Smith PetscCall(MatHermitianTransposeGetMat(B, &Bt)); 2043013e2dc7SBarry Smith PetscCall(PetscObjectTypeCompare((PetscObject)Bt, MATSEQAIJ, &fast)); 2044013e2dc7SBarry Smith } 204523875855Sstefano_zampini } 2046b68353e5Sstefano_zampini } 2047b68353e5Sstefano_zampini } 2048b68353e5Sstefano_zampini } 2049b68353e5Sstefano_zampini } 2050b68353e5Sstefano_zampini for (i = 0, nf = 0; i < nest->nr && fast; ++i) { 20519566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)nest->isglobal.row[i], ISSTRIDE, &fast)); 2052b68353e5Sstefano_zampini if (fast) { 2053b68353e5Sstefano_zampini PetscInt f, s; 2054b68353e5Sstefano_zampini 20559566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(nest->isglobal.row[i], &f, &s)); 20569371c9d4SSatish Balay if (f != nf || s != 1) { 20579371c9d4SSatish Balay fast = PETSC_FALSE; 20589371c9d4SSatish Balay } else { 20599566063dSJacob Faibussowitsch PetscCall(ISGetSize(nest->isglobal.row[i], &f)); 2060b68353e5Sstefano_zampini nf += f; 2061b68353e5Sstefano_zampini } 2062b68353e5Sstefano_zampini } 2063b68353e5Sstefano_zampini } 2064b68353e5Sstefano_zampini for (i = 0, nf = 0; i < nest->nc && fast; ++i) { 20659566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)nest->isglobal.col[i], ISSTRIDE, &fast)); 2066b68353e5Sstefano_zampini if (fast) { 2067b68353e5Sstefano_zampini PetscInt f, s; 2068b68353e5Sstefano_zampini 20699566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(nest->isglobal.col[i], &f, &s)); 20709371c9d4SSatish Balay if (f != nf || s != 1) { 20719371c9d4SSatish Balay fast = PETSC_FALSE; 20729371c9d4SSatish Balay } else { 20739566063dSJacob Faibussowitsch PetscCall(ISGetSize(nest->isglobal.col[i], &f)); 2074b68353e5Sstefano_zampini nf += f; 2075b68353e5Sstefano_zampini } 2076b68353e5Sstefano_zampini } 2077b68353e5Sstefano_zampini } 2078b68353e5Sstefano_zampini if (fast) { 20799566063dSJacob Faibussowitsch PetscCall(MatConvert_Nest_SeqAIJ_fast(A, newtype, reuse, newmat)); 20803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2081b68353e5Sstefano_zampini } 2082b68353e5Sstefano_zampini } 20839566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &M, &N)); 20849566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(A, &m, &n)); 20859566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRangeColumn(A, &cstart, &cend)); 2086d1487292SPierre Jolivet if (reuse == MAT_REUSE_MATRIX) C = *newmat; 2087d1487292SPierre Jolivet else { 20889566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 20899566063dSJacob Faibussowitsch PetscCall(MatSetType(C, newtype)); 20909566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, M, N)); 2091629c3df2SDmitry Karpeev } 20929566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(2 * m, &dnnz)); 2093e30678d3SPierre Jolivet if (m) { 2094629c3df2SDmitry Karpeev onnz = dnnz + m; 2095629c3df2SDmitry Karpeev for (k = 0; k < m; k++) { 2096629c3df2SDmitry Karpeev dnnz[k] = 0; 2097629c3df2SDmitry Karpeev onnz[k] = 0; 2098629c3df2SDmitry Karpeev } 2099e30678d3SPierre Jolivet } 2100629c3df2SDmitry Karpeev for (j = 0; j < nest->nc; ++j) { 2101629c3df2SDmitry Karpeev IS bNis; 2102629c3df2SDmitry Karpeev PetscInt bN; 2103629c3df2SDmitry Karpeev const PetscInt *bNindices; 2104fd8a7442SPierre Jolivet PetscBool flg; 2105629c3df2SDmitry Karpeev /* Using global column indices and ISAllGather() is not scalable. */ 21069566063dSJacob Faibussowitsch PetscCall(ISAllGather(nest->isglobal.col[j], &bNis)); 21079566063dSJacob Faibussowitsch PetscCall(ISGetSize(bNis, &bN)); 21089566063dSJacob Faibussowitsch PetscCall(ISGetIndices(bNis, &bNindices)); 2109629c3df2SDmitry Karpeev for (i = 0; i < nest->nr; ++i) { 2110629c3df2SDmitry Karpeev PetscSF bmsf; 2111649b366bSFande Kong PetscSFNode *iremote; 2112fd8a7442SPierre Jolivet Mat B = nest->m[i][j], D = NULL; 2113649b366bSFande Kong PetscInt bm, *sub_dnnz, *sub_onnz, br; 2114629c3df2SDmitry Karpeev const PetscInt *bmindices; 2115629c3df2SDmitry Karpeev if (!B) continue; 21169566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(nest->isglobal.row[i], &bm)); 21179566063dSJacob Faibussowitsch PetscCall(ISGetIndices(nest->isglobal.row[i], &bmindices)); 21189566063dSJacob Faibussowitsch PetscCall(PetscSFCreate(PetscObjectComm((PetscObject)A), &bmsf)); 21199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bm, &iremote)); 21209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bm, &sub_dnnz)); 21219566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bm, &sub_onnz)); 2122649b366bSFande Kong for (k = 0; k < bm; ++k) { 2123649b366bSFande Kong sub_dnnz[k] = 0; 2124649b366bSFande Kong sub_onnz[k] = 0; 2125649b366bSFande Kong } 2126dead4d76SPierre Jolivet PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &flg, MATTRANSPOSEVIRTUAL, MATHERMITIANTRANSPOSEVIRTUAL, "")); 2127fd8a7442SPierre Jolivet if (flg) { 2128fd8a7442SPierre Jolivet PetscTryMethod(B, "MatTransposeGetMat_C", (Mat, Mat *), (B, &D)); 2129fd8a7442SPierre Jolivet PetscTryMethod(B, "MatHermitianTransposeGetMat_C", (Mat, Mat *), (B, &D)); 2130fd8a7442SPierre Jolivet PetscCall(MatConvert(B, ((PetscObject)D)->type_name, MAT_INITIAL_MATRIX, &D)); 2131fd8a7442SPierre Jolivet B = D; 2132fd8a7442SPierre Jolivet } 2133fd8a7442SPierre Jolivet PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &flg, MATSEQSBAIJ, MATMPISBAIJ, "")); 2134fd8a7442SPierre Jolivet if (flg) { 2135fd8a7442SPierre Jolivet if (D) PetscCall(MatConvert(D, MATBAIJ, MAT_INPLACE_MATRIX, &D)); 2136fd8a7442SPierre Jolivet else PetscCall(MatConvert(B, MATBAIJ, MAT_INITIAL_MATRIX, &D)); 2137fd8a7442SPierre Jolivet B = D; 2138fd8a7442SPierre Jolivet } 2139629c3df2SDmitry Karpeev /* 2140629c3df2SDmitry Karpeev Locate the owners for all of the locally-owned global row indices for this row block. 2141629c3df2SDmitry Karpeev These determine the roots of PetscSF used to communicate preallocation data to row owners. 2142629c3df2SDmitry Karpeev The roots correspond to the dnnz and onnz entries; thus, there are two roots per row. 2143629c3df2SDmitry Karpeev */ 21449566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(B, &rstart, NULL)); 2145629c3df2SDmitry Karpeev for (br = 0; br < bm; ++br) { 2146131c27b5Sprj- PetscInt row = bmindices[br], brncols, col; 2147629c3df2SDmitry Karpeev const PetscInt *brcols; 2148a4b3d3acSMatthew G Knepley PetscInt rowrel = 0; /* row's relative index on its owner rank */ 2149131c27b5Sprj- PetscMPIInt rowowner = 0; 21509566063dSJacob Faibussowitsch PetscCall(PetscLayoutFindOwnerIndex(A->rmap, row, &rowowner, &rowrel)); 2151649b366bSFande Kong /* how many roots */ 21529371c9d4SSatish Balay iremote[br].rank = rowowner; 21539371c9d4SSatish Balay iremote[br].index = rowrel; /* edge from bmdnnz to dnnz */ 2154649b366bSFande Kong /* get nonzero pattern */ 21559566063dSJacob Faibussowitsch PetscCall(MatGetRow(B, br + rstart, &brncols, &brcols, NULL)); 2156629c3df2SDmitry Karpeev for (k = 0; k < brncols; k++) { 2157629c3df2SDmitry Karpeev col = bNindices[brcols[k]]; 2158649b366bSFande Kong if (col >= A->cmap->range[rowowner] && col < A->cmap->range[rowowner + 1]) { 2159649b366bSFande Kong sub_dnnz[br]++; 2160649b366bSFande Kong } else { 2161649b366bSFande Kong sub_onnz[br]++; 2162649b366bSFande Kong } 2163629c3df2SDmitry Karpeev } 21649566063dSJacob Faibussowitsch PetscCall(MatRestoreRow(B, br + rstart, &brncols, &brcols, NULL)); 2165629c3df2SDmitry Karpeev } 2166fd8a7442SPierre Jolivet if (D) PetscCall(MatDestroy(&D)); 21679566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(nest->isglobal.row[i], &bmindices)); 2168629c3df2SDmitry Karpeev /* bsf will have to take care of disposing of bedges. */ 21699566063dSJacob Faibussowitsch PetscCall(PetscSFSetGraph(bmsf, m, bm, NULL, PETSC_OWN_POINTER, iremote, PETSC_OWN_POINTER)); 21709566063dSJacob Faibussowitsch PetscCall(PetscSFReduceBegin(bmsf, MPIU_INT, sub_dnnz, dnnz, MPI_SUM)); 21719566063dSJacob Faibussowitsch PetscCall(PetscSFReduceEnd(bmsf, MPIU_INT, sub_dnnz, dnnz, MPI_SUM)); 21729566063dSJacob Faibussowitsch PetscCall(PetscSFReduceBegin(bmsf, MPIU_INT, sub_onnz, onnz, MPI_SUM)); 21739566063dSJacob Faibussowitsch PetscCall(PetscSFReduceEnd(bmsf, MPIU_INT, sub_onnz, onnz, MPI_SUM)); 21749566063dSJacob Faibussowitsch PetscCall(PetscFree(sub_dnnz)); 21759566063dSJacob Faibussowitsch PetscCall(PetscFree(sub_onnz)); 21769566063dSJacob Faibussowitsch PetscCall(PetscSFDestroy(&bmsf)); 2177629c3df2SDmitry Karpeev } 21789566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(bNis, &bNindices)); 21799566063dSJacob Faibussowitsch PetscCall(ISDestroy(&bNis)); 218065a4a0a3Sstefano_zampini } 218165a4a0a3Sstefano_zampini /* Resize preallocation if overestimated */ 218265a4a0a3Sstefano_zampini for (i = 0; i < m; i++) { 218365a4a0a3Sstefano_zampini dnnz[i] = PetscMin(dnnz[i], A->cmap->n); 218465a4a0a3Sstefano_zampini onnz[i] = PetscMin(onnz[i], A->cmap->N - A->cmap->n); 2185629c3df2SDmitry Karpeev } 21869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, dnnz)); 21879566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(C, 0, dnnz, 0, onnz)); 21889566063dSJacob Faibussowitsch PetscCall(PetscFree(dnnz)); 21899566063dSJacob Faibussowitsch PetscCall(MatAXPY_Dense_Nest(C, 1.0, A)); 2190d1487292SPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) { 21919566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A, &C)); 2192d1487292SPierre Jolivet } else *newmat = C; 21933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2194be705e3aSPierre Jolivet } 2195629c3df2SDmitry Karpeev 219666976f2fSJacob Faibussowitsch static PetscErrorCode MatConvert_Nest_Dense(Mat A, MatType newtype, MatReuse reuse, Mat *newmat) 2197d71ae5a4SJacob Faibussowitsch { 2198629c3df2SDmitry Karpeev Mat B; 2199be705e3aSPierre Jolivet PetscInt m, n, M, N; 2200be705e3aSPierre Jolivet 2201be705e3aSPierre Jolivet PetscFunctionBegin; 22029566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &M, &N)); 22039566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(A, &m, &n)); 2204be705e3aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 2205be705e3aSPierre Jolivet B = *newmat; 22069566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(B)); 2207be705e3aSPierre Jolivet } else { 22089566063dSJacob Faibussowitsch PetscCall(MatCreateDense(PetscObjectComm((PetscObject)A), m, PETSC_DECIDE, M, N, NULL, &B)); 2209629c3df2SDmitry Karpeev } 22109566063dSJacob Faibussowitsch PetscCall(MatAXPY_Dense_Nest(B, 1.0, A)); 2211be705e3aSPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) { 22129566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A, &B)); 2213be705e3aSPierre Jolivet } else if (reuse == MAT_INITIAL_MATRIX) *newmat = B; 22143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2215629c3df2SDmitry Karpeev } 2216629c3df2SDmitry Karpeev 221766976f2fSJacob Faibussowitsch static PetscErrorCode MatHasOperation_Nest(Mat mat, MatOperation op, PetscBool *has) 2218d71ae5a4SJacob Faibussowitsch { 22198b7d3b4bSBarry Smith Mat_Nest *bA = (Mat_Nest *)mat->data; 22203c6db4c4SPierre Jolivet MatOperation opAdd; 22218b7d3b4bSBarry Smith PetscInt i, j, nr = bA->nr, nc = bA->nc; 22228b7d3b4bSBarry Smith PetscBool flg; 22238b7d3b4bSBarry Smith 22244d86920dSPierre Jolivet PetscFunctionBegin; 222552c5f739Sprj- *has = PETSC_FALSE; 22263c6db4c4SPierre Jolivet if (op == MATOP_MULT || op == MATOP_MULT_ADD || op == MATOP_MULT_TRANSPOSE || op == MATOP_MULT_TRANSPOSE_ADD) { 22273c6db4c4SPierre Jolivet opAdd = (op == MATOP_MULT || op == MATOP_MULT_ADD ? MATOP_MULT_ADD : MATOP_MULT_TRANSPOSE_ADD); 22288b7d3b4bSBarry Smith for (j = 0; j < nc; j++) { 22298b7d3b4bSBarry Smith for (i = 0; i < nr; i++) { 22308b7d3b4bSBarry Smith if (!bA->m[i][j]) continue; 22319566063dSJacob Faibussowitsch PetscCall(MatHasOperation(bA->m[i][j], opAdd, &flg)); 22323ba16761SJacob Faibussowitsch if (!flg) PetscFunctionReturn(PETSC_SUCCESS); 22338b7d3b4bSBarry Smith } 22348b7d3b4bSBarry Smith } 22358b7d3b4bSBarry Smith } 22363c6db4c4SPierre Jolivet if (((void **)mat->ops)[op]) *has = PETSC_TRUE; 22373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22388b7d3b4bSBarry Smith } 22398b7d3b4bSBarry Smith 2240659c6bb0SJed Brown /*MC 22412ef1f0ffSBarry Smith MATNEST - "nest" - Matrix type consisting of nested submatrices, each stored separately. 2242659c6bb0SJed Brown 2243659c6bb0SJed Brown Level: intermediate 2244659c6bb0SJed Brown 2245659c6bb0SJed Brown Notes: 224611a5261eSBarry Smith This matrix type permits scalable use of `PCFIELDSPLIT` and avoids the large memory costs of extracting submatrices. 2247659c6bb0SJed Brown It allows the use of symmetric and block formats for parts of multi-physics simulations. 224811a5261eSBarry Smith It is usually used with `DMCOMPOSITE` and `DMCreateMatrix()` 2249659c6bb0SJed Brown 22508b7d3b4bSBarry Smith Each of the submatrices lives on the same MPI communicator as the original nest matrix (though they can have zero 22518b7d3b4bSBarry Smith rows/columns on some processes.) Thus this is not meant for cases where the submatrices live on far fewer processes 22528b7d3b4bSBarry Smith than the nest matrix. 22538b7d3b4bSBarry Smith 22541cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatCreate()`, `MatType`, `MatCreateNest()`, `MatNestSetSubMat()`, `MatNestGetSubMat()`, 2255db781477SPatrick Sanan `VecCreateNest()`, `DMCreateMatrix()`, `DMCOMPOSITE`, `MatNestSetVecType()`, `MatNestGetLocalISs()`, 2256db781477SPatrick Sanan `MatNestGetISs()`, `MatNestSetSubMats()`, `MatNestGetSubMats()` 2257659c6bb0SJed Brown M*/ 2258d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_Nest(Mat A) 2259d71ae5a4SJacob Faibussowitsch { 2260c8883902SJed Brown Mat_Nest *s; 2261c8883902SJed Brown 2262c8883902SJed Brown PetscFunctionBegin; 22634dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&s)); 2264c8883902SJed Brown A->data = (void *)s; 2265e7c19651SJed Brown 2266e7c19651SJed Brown s->nr = -1; 2267e7c19651SJed Brown s->nc = -1; 22680298fd71SBarry Smith s->m = NULL; 2269e7c19651SJed Brown s->splitassembly = PETSC_FALSE; 2270c8883902SJed Brown 22719566063dSJacob Faibussowitsch PetscCall(PetscMemzero(A->ops, sizeof(*A->ops))); 227226fbe8dcSKarl Rupp 2273c8883902SJed Brown A->ops->mult = MatMult_Nest; 22749194d70fSJed Brown A->ops->multadd = MatMultAdd_Nest; 2275c8883902SJed Brown A->ops->multtranspose = MatMultTranspose_Nest; 22769194d70fSJed Brown A->ops->multtransposeadd = MatMultTransposeAdd_Nest; 2277f8170845SAlex Fikl A->ops->transpose = MatTranspose_Nest; 22780998551bSBlanca Mellado Pinto A->ops->multhermitiantranspose = MatMultHermitianTranspose_Nest; 22790998551bSBlanca Mellado Pinto A->ops->multhermitiantransposeadd = MatMultHermitianTransposeAdd_Nest; 2280c8883902SJed Brown A->ops->assemblybegin = MatAssemblyBegin_Nest; 2281c8883902SJed Brown A->ops->assemblyend = MatAssemblyEnd_Nest; 2282c8883902SJed Brown A->ops->zeroentries = MatZeroEntries_Nest; 2283c222c20dSDavid Ham A->ops->copy = MatCopy_Nest; 22846e76ffeaSPierre Jolivet A->ops->axpy = MatAXPY_Nest; 2285c8883902SJed Brown A->ops->duplicate = MatDuplicate_Nest; 22867dae84e0SHong Zhang A->ops->createsubmatrix = MatCreateSubMatrix_Nest; 2287c8883902SJed Brown A->ops->destroy = MatDestroy_Nest; 2288c8883902SJed Brown A->ops->view = MatView_Nest; 2289f4259b30SLisandro Dalcin A->ops->getvecs = NULL; /* Use VECNEST by calling MatNestSetVecType(A,VECNEST) */ 2290c8883902SJed Brown A->ops->getlocalsubmatrix = MatGetLocalSubMatrix_Nest; 2291c8883902SJed Brown A->ops->restorelocalsubmatrix = MatRestoreLocalSubMatrix_Nest; 2292429bac76SJed Brown A->ops->getdiagonal = MatGetDiagonal_Nest; 2293429bac76SJed Brown A->ops->diagonalscale = MatDiagonalScale_Nest; 2294a061e289SJed Brown A->ops->scale = MatScale_Nest; 2295a061e289SJed Brown A->ops->shift = MatShift_Nest; 229613135bc6SAlex Fikl A->ops->diagonalset = MatDiagonalSet_Nest; 2297f8170845SAlex Fikl A->ops->setrandom = MatSetRandom_Nest; 22988b7d3b4bSBarry Smith A->ops->hasoperation = MatHasOperation_Nest; 2299381b8e50SStefano Zampini A->ops->missingdiagonal = MatMissingDiagonal_Nest; 2300c8883902SJed Brown 2301f4259b30SLisandro Dalcin A->spptr = NULL; 2302c8883902SJed Brown A->assembled = PETSC_FALSE; 2303c8883902SJed Brown 2304c8883902SJed Brown /* expose Nest api's */ 23059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetSubMat_C", MatNestGetSubMat_Nest)); 23069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestSetSubMat_C", MatNestSetSubMat_Nest)); 23079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetSubMats_C", MatNestGetSubMats_Nest)); 23089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetSize_C", MatNestGetSize_Nest)); 23099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetISs_C", MatNestGetISs_Nest)); 23109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetLocalISs_C", MatNestGetLocalISs_Nest)); 23119566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestSetVecType_C", MatNestSetVecType_Nest)); 23129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestSetSubMats_C", MatNestSetSubMats_Nest)); 23139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_mpiaij_C", MatConvert_Nest_AIJ)); 23149566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_seqaij_C", MatConvert_Nest_AIJ)); 23159566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_aij_C", MatConvert_Nest_AIJ)); 23169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_is_C", MatConvert_Nest_IS)); 23179566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_mpidense_C", MatConvert_Nest_Dense)); 23189566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_seqdense_C", MatConvert_Nest_Dense)); 23199566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_nest_seqdense_C", MatProductSetFromOptions_Nest_Dense)); 23209566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_nest_mpidense_C", MatProductSetFromOptions_Nest_Dense)); 2321c8883902SJed Brown 23229566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, MATNEST)); 23233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2324c8883902SJed Brown } 2325