1aaa7dc30SBarry Smith #include <../src/mat/impls/nest/matnestimpl.h> /*I "petscmat.h" I*/ 2b68353e5Sstefano_zampini #include <../src/mat/impls/aij/seq/aij.h> 30c312b8eSJed Brown #include <petscsf.h> 4d8588912SDave May 5c8883902SJed Brown static PetscErrorCode MatSetUp_NestIS_Private(Mat, PetscInt, const IS[], PetscInt, const IS[]); 606a1af2fSStefano Zampini static PetscErrorCode MatCreateVecs_Nest(Mat, Vec *, Vec *); 706a1af2fSStefano Zampini static PetscErrorCode MatReset_Nest(Mat); 806a1af2fSStefano Zampini 95e3038f0Sstefano_zampini PETSC_INTERN PetscErrorCode MatConvert_Nest_IS(Mat, MatType, MatReuse, Mat *); 10c8883902SJed Brown 11d8588912SDave May /* private functions */ 12d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestGetSizes_Private(Mat A, PetscInt *m, PetscInt *n, PetscInt *M, PetscInt *N) 13d71ae5a4SJacob Faibussowitsch { 14d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 158188e55aSJed Brown PetscInt i, j; 16d8588912SDave May 17d8588912SDave May PetscFunctionBegin; 188188e55aSJed Brown *m = *n = *M = *N = 0; 198188e55aSJed Brown for (i = 0; i < bA->nr; i++) { /* rows */ 208188e55aSJed Brown PetscInt sm, sM; 219566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(bA->isglobal.row[i], &sm)); 229566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.row[i], &sM)); 238188e55aSJed Brown *m += sm; 248188e55aSJed Brown *M += sM; 25d8588912SDave May } 268188e55aSJed Brown for (j = 0; j < bA->nc; j++) { /* cols */ 278188e55aSJed Brown PetscInt sn, sN; 289566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(bA->isglobal.col[j], &sn)); 299566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.col[j], &sN)); 308188e55aSJed Brown *n += sn; 318188e55aSJed Brown *N += sN; 32d8588912SDave May } 333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 34d8588912SDave May } 35d8588912SDave May 36d8588912SDave May /* operations */ 37d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMult_Nest(Mat A, Vec x, Vec y) 38d71ae5a4SJacob Faibussowitsch { 39d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 40207556f9SJed Brown Vec *bx = bA->right, *by = bA->left; 41207556f9SJed Brown PetscInt i, j, nr = bA->nr, nc = bA->nc; 42d8588912SDave May 43d8588912SDave May PetscFunctionBegin; 449566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecGetSubVector(y, bA->isglobal.row[i], &by[i])); 459566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecGetSubVector(x, bA->isglobal.col[i], &bx[i])); 46207556f9SJed Brown for (i = 0; i < nr; i++) { 479566063dSJacob Faibussowitsch PetscCall(VecZeroEntries(by[i])); 48207556f9SJed Brown for (j = 0; j < nc; j++) { 49207556f9SJed Brown if (!bA->m[i][j]) continue; 50d8588912SDave May /* y[i] <- y[i] + A[i][j] * x[j] */ 519566063dSJacob Faibussowitsch PetscCall(MatMultAdd(bA->m[i][j], bx[j], by[i], by[i])); 52d8588912SDave May } 53d8588912SDave May } 549566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecRestoreSubVector(y, bA->isglobal.row[i], &by[i])); 559566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecRestoreSubVector(x, bA->isglobal.col[i], &bx[i])); 563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 57d8588912SDave May } 58d8588912SDave May 59d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMultAdd_Nest(Mat A, Vec x, Vec y, Vec z) 60d71ae5a4SJacob Faibussowitsch { 619194d70fSJed Brown Mat_Nest *bA = (Mat_Nest *)A->data; 629194d70fSJed Brown Vec *bx = bA->right, *bz = bA->left; 639194d70fSJed Brown PetscInt i, j, nr = bA->nr, nc = bA->nc; 649194d70fSJed Brown 659194d70fSJed Brown PetscFunctionBegin; 669566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecGetSubVector(z, bA->isglobal.row[i], &bz[i])); 679566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecGetSubVector(x, bA->isglobal.col[i], &bx[i])); 689194d70fSJed Brown for (i = 0; i < nr; i++) { 699194d70fSJed Brown if (y != z) { 709194d70fSJed Brown Vec by; 719566063dSJacob Faibussowitsch PetscCall(VecGetSubVector(y, bA->isglobal.row[i], &by)); 729566063dSJacob Faibussowitsch PetscCall(VecCopy(by, bz[i])); 739566063dSJacob Faibussowitsch PetscCall(VecRestoreSubVector(y, bA->isglobal.row[i], &by)); 749194d70fSJed Brown } 759194d70fSJed Brown for (j = 0; j < nc; j++) { 769194d70fSJed Brown if (!bA->m[i][j]) continue; 779194d70fSJed Brown /* y[i] <- y[i] + A[i][j] * x[j] */ 789566063dSJacob Faibussowitsch PetscCall(MatMultAdd(bA->m[i][j], bx[j], bz[i], bz[i])); 799194d70fSJed Brown } 809194d70fSJed Brown } 819566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecRestoreSubVector(z, bA->isglobal.row[i], &bz[i])); 829566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecRestoreSubVector(x, bA->isglobal.col[i], &bx[i])); 833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 849194d70fSJed Brown } 859194d70fSJed Brown 8652c5f739Sprj- typedef struct { 8752c5f739Sprj- Mat *workC; /* array of Mat with specific containers depending on the underlying MatMatMult implementation */ 8852c5f739Sprj- PetscScalar *tarray; /* buffer for storing all temporary products A[i][j] B[j] */ 8952c5f739Sprj- PetscInt *dm, *dn, k; /* displacements and number of submatrices */ 9052c5f739Sprj- } Nest_Dense; 9152c5f739Sprj- 92a678f235SPierre Jolivet static PetscErrorCode MatProductNumeric_Nest_Dense(Mat C) 93d71ae5a4SJacob Faibussowitsch { 946718818eSStefano Zampini Mat_Nest *bA; 9552c5f739Sprj- Nest_Dense *contents; 966718818eSStefano Zampini Mat viewB, viewC, productB, workC; 9752c5f739Sprj- const PetscScalar *barray; 9852c5f739Sprj- PetscScalar *carray; 996718818eSStefano Zampini PetscInt i, j, M, N, nr, nc, ldb, ldc; 1006718818eSStefano Zampini Mat A, B; 10152c5f739Sprj- 10252c5f739Sprj- PetscFunctionBegin; 1030d6f747bSJacob Faibussowitsch MatCheckProduct(C, 1); 1046718818eSStefano Zampini A = C->product->A; 1056718818eSStefano Zampini B = C->product->B; 1069566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, NULL, &N)); 1076718818eSStefano Zampini if (!N) { 1089566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 1099566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 1103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1116718818eSStefano Zampini } 1126718818eSStefano Zampini contents = (Nest_Dense *)C->product->data; 11328b400f6SJacob Faibussowitsch PetscCheck(contents, PetscObjectComm((PetscObject)C), PETSC_ERR_PLIB, "Product data empty"); 1146718818eSStefano Zampini bA = (Mat_Nest *)A->data; 1156718818eSStefano Zampini nr = bA->nr; 1166718818eSStefano Zampini nc = bA->nc; 1179566063dSJacob Faibussowitsch PetscCall(MatDenseGetLDA(B, &ldb)); 1189566063dSJacob Faibussowitsch PetscCall(MatDenseGetLDA(C, &ldc)); 1199566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(C)); 1209566063dSJacob Faibussowitsch PetscCall(MatDenseGetArrayRead(B, &barray)); 1219566063dSJacob Faibussowitsch PetscCall(MatDenseGetArray(C, &carray)); 12252c5f739Sprj- for (i = 0; i < nr; i++) { 1239566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.row[i], &M)); 1248e3a54c0SPierre Jolivet PetscCall(MatCreateDense(PetscObjectComm((PetscObject)A), contents->dm[i + 1] - contents->dm[i], PETSC_DECIDE, M, N, PetscSafePointerPlusOffset(carray, contents->dm[i]), &viewC)); 1259566063dSJacob Faibussowitsch PetscCall(MatDenseSetLDA(viewC, ldc)); 12652c5f739Sprj- for (j = 0; j < nc; j++) { 12752c5f739Sprj- if (!bA->m[i][j]) continue; 1289566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.col[j], &M)); 1298e3a54c0SPierre Jolivet PetscCall(MatCreateDense(PetscObjectComm((PetscObject)A), contents->dn[j + 1] - contents->dn[j], PETSC_DECIDE, M, N, PetscSafePointerPlusOffset((PetscScalar *)barray, contents->dn[j]), &viewB)); 1309566063dSJacob Faibussowitsch PetscCall(MatDenseSetLDA(viewB, ldb)); 1314222ddf1SHong Zhang 1324222ddf1SHong Zhang /* MatMatMultNumeric(bA->m[i][j],viewB,contents->workC[i*nc + j]); */ 1334222ddf1SHong Zhang workC = contents->workC[i * nc + j]; 1344222ddf1SHong Zhang productB = workC->product->B; 1354222ddf1SHong Zhang workC->product->B = viewB; /* use newly created dense matrix viewB */ 1369566063dSJacob Faibussowitsch PetscCall(MatProductNumeric(workC)); 1379566063dSJacob Faibussowitsch PetscCall(MatDestroy(&viewB)); 1384222ddf1SHong Zhang workC->product->B = productB; /* resume original B */ 1394222ddf1SHong Zhang 14052c5f739Sprj- /* C[i] <- workC + C[i] */ 1419566063dSJacob Faibussowitsch PetscCall(MatAXPY(viewC, 1.0, contents->workC[i * nc + j], SAME_NONZERO_PATTERN)); 14252c5f739Sprj- } 1439566063dSJacob Faibussowitsch PetscCall(MatDestroy(&viewC)); 14452c5f739Sprj- } 1459566063dSJacob Faibussowitsch PetscCall(MatDenseRestoreArray(C, &carray)); 1469566063dSJacob Faibussowitsch PetscCall(MatDenseRestoreArrayRead(B, &barray)); 1474222ddf1SHong Zhang 14867af85e8SPierre Jolivet PetscCall(MatSetOption(C, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE)); 1499566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 1509566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 1513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 15252c5f739Sprj- } 15352c5f739Sprj- 15466976f2fSJacob Faibussowitsch static PetscErrorCode MatNest_DenseDestroy(void *ctx) 155d71ae5a4SJacob Faibussowitsch { 15652c5f739Sprj- Nest_Dense *contents = (Nest_Dense *)ctx; 15752c5f739Sprj- PetscInt i; 15852c5f739Sprj- 15952c5f739Sprj- PetscFunctionBegin; 1609566063dSJacob Faibussowitsch PetscCall(PetscFree(contents->tarray)); 16148a46eb9SPierre Jolivet for (i = 0; i < contents->k; i++) PetscCall(MatDestroy(contents->workC + i)); 1629566063dSJacob Faibussowitsch PetscCall(PetscFree3(contents->dm, contents->dn, contents->workC)); 1639566063dSJacob Faibussowitsch PetscCall(PetscFree(contents)); 1643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 16552c5f739Sprj- } 16652c5f739Sprj- 167a678f235SPierre Jolivet static PetscErrorCode MatProductSymbolic_Nest_Dense(Mat C) 168d71ae5a4SJacob Faibussowitsch { 1696718818eSStefano Zampini Mat_Nest *bA; 1706718818eSStefano Zampini Mat viewB, workC; 17152c5f739Sprj- const PetscScalar *barray; 1726718818eSStefano Zampini PetscInt i, j, M, N, m, n, nr, nc, maxm = 0, ldb; 1734222ddf1SHong Zhang Nest_Dense *contents = NULL; 1746718818eSStefano Zampini PetscBool cisdense; 1756718818eSStefano Zampini Mat A, B; 1766718818eSStefano Zampini PetscReal fill; 17752c5f739Sprj- 17852c5f739Sprj- PetscFunctionBegin; 1790d6f747bSJacob Faibussowitsch MatCheckProduct(C, 1); 18028b400f6SJacob Faibussowitsch PetscCheck(!C->product->data, PetscObjectComm((PetscObject)C), PETSC_ERR_PLIB, "Product data not empty"); 1816718818eSStefano Zampini A = C->product->A; 1826718818eSStefano Zampini B = C->product->B; 1836718818eSStefano Zampini fill = C->product->fill; 1846718818eSStefano Zampini bA = (Mat_Nest *)A->data; 1856718818eSStefano Zampini nr = bA->nr; 1866718818eSStefano Zampini nc = bA->nc; 1879566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(C, &m, &n)); 1889566063dSJacob Faibussowitsch PetscCall(MatGetSize(C, &M, &N)); 1890572eedcSPierre Jolivet if (m == PETSC_DECIDE || n == PETSC_DECIDE || M == PETSC_DECIDE || N == PETSC_DECIDE) { 1909566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(B, NULL, &n)); 1919566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, NULL, &N)); 1929566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(A, &m, NULL)); 1939566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &M, NULL)); 1949566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, M, N)); 1950572eedcSPierre Jolivet } 1969566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATMPIDENSE, MATSEQDENSECUDA, MATMPIDENSECUDA, "")); 19748a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, ((PetscObject)B)->type_name)); 1989566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 1996718818eSStefano Zampini if (!N) { 2006718818eSStefano Zampini C->ops->productnumeric = MatProductNumeric_Nest_Dense; 2013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 20252c5f739Sprj- } 20352c5f739Sprj- 2049566063dSJacob Faibussowitsch PetscCall(PetscNew(&contents)); 2056718818eSStefano Zampini C->product->data = contents; 2066718818eSStefano Zampini C->product->destroy = MatNest_DenseDestroy; 2079566063dSJacob Faibussowitsch PetscCall(PetscCalloc3(nr + 1, &contents->dm, nc + 1, &contents->dn, nr * nc, &contents->workC)); 20852c5f739Sprj- contents->k = nr * nc; 20952c5f739Sprj- for (i = 0; i < nr; i++) { 2109566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(bA->isglobal.row[i], contents->dm + i + 1)); 21152c5f739Sprj- maxm = PetscMax(maxm, contents->dm[i + 1]); 21252c5f739Sprj- contents->dm[i + 1] += contents->dm[i]; 21352c5f739Sprj- } 21452c5f739Sprj- for (i = 0; i < nc; i++) { 2159566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(bA->isglobal.col[i], contents->dn + i + 1)); 21652c5f739Sprj- contents->dn[i + 1] += contents->dn[i]; 21752c5f739Sprj- } 2189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(maxm * N, &contents->tarray)); 2199566063dSJacob Faibussowitsch PetscCall(MatDenseGetLDA(B, &ldb)); 2209566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, NULL, &N)); 2219566063dSJacob Faibussowitsch PetscCall(MatDenseGetArrayRead(B, &barray)); 22252c5f739Sprj- /* loops are permuted compared to MatMatMultNumeric so that viewB is created only once per column of A */ 22352c5f739Sprj- for (j = 0; j < nc; j++) { 2249566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.col[j], &M)); 2258e3a54c0SPierre Jolivet PetscCall(MatCreateDense(PetscObjectComm((PetscObject)A), contents->dn[j + 1] - contents->dn[j], PETSC_DECIDE, M, N, PetscSafePointerPlusOffset((PetscScalar *)barray, contents->dn[j]), &viewB)); 2269566063dSJacob Faibussowitsch PetscCall(MatDenseSetLDA(viewB, ldb)); 22752c5f739Sprj- for (i = 0; i < nr; i++) { 22852c5f739Sprj- if (!bA->m[i][j]) continue; 22952c5f739Sprj- /* MatMatMultSymbolic may attach a specific container (depending on MatType of bA->m[i][j]) to workC[i][j] */ 2304222ddf1SHong Zhang 2319566063dSJacob Faibussowitsch PetscCall(MatProductCreate(bA->m[i][j], viewB, NULL, &contents->workC[i * nc + j])); 2324222ddf1SHong Zhang workC = contents->workC[i * nc + j]; 2339566063dSJacob Faibussowitsch PetscCall(MatProductSetType(workC, MATPRODUCT_AB)); 2349566063dSJacob Faibussowitsch PetscCall(MatProductSetAlgorithm(workC, "default")); 2359566063dSJacob Faibussowitsch PetscCall(MatProductSetFill(workC, fill)); 2369566063dSJacob Faibussowitsch PetscCall(MatProductSetFromOptions(workC)); 2379566063dSJacob Faibussowitsch PetscCall(MatProductSymbolic(workC)); 2384222ddf1SHong Zhang 2396718818eSStefano Zampini /* since tarray will be shared by all Mat */ 2409566063dSJacob Faibussowitsch PetscCall(MatSeqDenseSetPreallocation(workC, contents->tarray)); 2419566063dSJacob Faibussowitsch PetscCall(MatMPIDenseSetPreallocation(workC, contents->tarray)); 24252c5f739Sprj- } 2439566063dSJacob Faibussowitsch PetscCall(MatDestroy(&viewB)); 24452c5f739Sprj- } 2459566063dSJacob Faibussowitsch PetscCall(MatDenseRestoreArrayRead(B, &barray)); 24652c5f739Sprj- 2476718818eSStefano Zampini C->ops->productnumeric = MatProductNumeric_Nest_Dense; 2483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24952c5f739Sprj- } 25052c5f739Sprj- 251a678f235SPierre Jolivet static PetscErrorCode MatProductSetFromOptions_Nest_Dense(Mat C) 252d71ae5a4SJacob Faibussowitsch { 2534222ddf1SHong Zhang Mat_Product *product = C->product; 25452c5f739Sprj- 25552c5f739Sprj- PetscFunctionBegin; 256c57d7d18SPierre Jolivet if (product->type == MATPRODUCT_AB) C->ops->productsymbolic = MatProductSymbolic_Nest_Dense; 2573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 25852c5f739Sprj- } 25952c5f739Sprj- 2600998551bSBlanca Mellado Pinto static PetscErrorCode MatMultTransposeKernel_Nest(Mat A, Vec x, Vec y, PetscBool herm) 261d71ae5a4SJacob Faibussowitsch { 262d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 263207556f9SJed Brown Vec *bx = bA->left, *by = bA->right; 264207556f9SJed Brown PetscInt i, j, nr = bA->nr, nc = bA->nc; 265d8588912SDave May 266d8588912SDave May PetscFunctionBegin; 2679566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecGetSubVector(x, bA->isglobal.row[i], &bx[i])); 2689566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecGetSubVector(y, bA->isglobal.col[i], &by[i])); 269207556f9SJed Brown for (j = 0; j < nc; j++) { 2709566063dSJacob Faibussowitsch PetscCall(VecZeroEntries(by[j])); 271609e31cbSJed Brown for (i = 0; i < nr; i++) { 2726c75ac25SJed Brown if (!bA->m[i][j]) continue; 2730998551bSBlanca Mellado Pinto if (herm) PetscCall(MatMultHermitianTransposeAdd(bA->m[i][j], bx[i], by[j], by[j])); /* y[j] <- y[j] + (A[i][j])^H * x[i] */ 2740998551bSBlanca Mellado Pinto else PetscCall(MatMultTransposeAdd(bA->m[i][j], bx[i], by[j], by[j])); /* y[j] <- y[j] + (A[i][j])^T * x[i] */ 275d8588912SDave May } 276d8588912SDave May } 2779566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecRestoreSubVector(x, bA->isglobal.row[i], &bx[i])); 2789566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecRestoreSubVector(y, bA->isglobal.col[i], &by[i])); 2793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 280d8588912SDave May } 281d8588912SDave May 2820998551bSBlanca Mellado Pinto static PetscErrorCode MatMultTranspose_Nest(Mat A, Vec x, Vec y) 2830998551bSBlanca Mellado Pinto { 2840998551bSBlanca Mellado Pinto PetscFunctionBegin; 2850998551bSBlanca Mellado Pinto PetscCall(MatMultTransposeKernel_Nest(A, x, y, PETSC_FALSE)); 2860998551bSBlanca Mellado Pinto PetscFunctionReturn(PETSC_SUCCESS); 2870998551bSBlanca Mellado Pinto } 2880998551bSBlanca Mellado Pinto 2890998551bSBlanca Mellado Pinto static PetscErrorCode MatMultHermitianTranspose_Nest(Mat A, Vec x, Vec y) 2900998551bSBlanca Mellado Pinto { 2910998551bSBlanca Mellado Pinto PetscFunctionBegin; 2920998551bSBlanca Mellado Pinto PetscCall(MatMultTransposeKernel_Nest(A, x, y, PETSC_TRUE)); 2930998551bSBlanca Mellado Pinto PetscFunctionReturn(PETSC_SUCCESS); 2940998551bSBlanca Mellado Pinto } 2950998551bSBlanca Mellado Pinto 2960998551bSBlanca Mellado Pinto static PetscErrorCode MatMultTransposeAddKernel_Nest(Mat A, Vec x, Vec y, Vec z, PetscBool herm) 297d71ae5a4SJacob Faibussowitsch { 2989194d70fSJed Brown Mat_Nest *bA = (Mat_Nest *)A->data; 2999194d70fSJed Brown Vec *bx = bA->left, *bz = bA->right; 3009194d70fSJed Brown PetscInt i, j, nr = bA->nr, nc = bA->nc; 3019194d70fSJed Brown 3029194d70fSJed Brown PetscFunctionBegin; 3039566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecGetSubVector(x, bA->isglobal.row[i], &bx[i])); 3049566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecGetSubVector(z, bA->isglobal.col[i], &bz[i])); 3059194d70fSJed Brown for (j = 0; j < nc; j++) { 3069194d70fSJed Brown if (y != z) { 3079194d70fSJed Brown Vec by; 3089566063dSJacob Faibussowitsch PetscCall(VecGetSubVector(y, bA->isglobal.col[j], &by)); 3099566063dSJacob Faibussowitsch PetscCall(VecCopy(by, bz[j])); 3109566063dSJacob Faibussowitsch PetscCall(VecRestoreSubVector(y, bA->isglobal.col[j], &by)); 3119194d70fSJed Brown } 3129194d70fSJed Brown for (i = 0; i < nr; i++) { 3136c75ac25SJed Brown if (!bA->m[i][j]) continue; 3140998551bSBlanca Mellado Pinto if (herm) PetscCall(MatMultHermitianTransposeAdd(bA->m[i][j], bx[i], bz[j], bz[j])); /* z[j] <- y[j] + (A[i][j])^H * x[i] */ 3150998551bSBlanca Mellado Pinto else PetscCall(MatMultTransposeAdd(bA->m[i][j], bx[i], bz[j], bz[j])); /* z[j] <- y[j] + (A[i][j])^T * x[i] */ 3169194d70fSJed Brown } 3179194d70fSJed Brown } 3189566063dSJacob Faibussowitsch for (i = 0; i < nr; i++) PetscCall(VecRestoreSubVector(x, bA->isglobal.row[i], &bx[i])); 3199566063dSJacob Faibussowitsch for (i = 0; i < nc; i++) PetscCall(VecRestoreSubVector(z, bA->isglobal.col[i], &bz[i])); 3203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3219194d70fSJed Brown } 3229194d70fSJed Brown 3230998551bSBlanca Mellado Pinto static PetscErrorCode MatMultTransposeAdd_Nest(Mat A, Vec x, Vec y, Vec z) 3240998551bSBlanca Mellado Pinto { 3250998551bSBlanca Mellado Pinto PetscFunctionBegin; 3260998551bSBlanca Mellado Pinto PetscCall(MatMultTransposeAddKernel_Nest(A, x, y, z, PETSC_FALSE)); 3270998551bSBlanca Mellado Pinto PetscFunctionReturn(PETSC_SUCCESS); 3280998551bSBlanca Mellado Pinto } 3290998551bSBlanca Mellado Pinto 3300998551bSBlanca Mellado Pinto static PetscErrorCode MatMultHermitianTransposeAdd_Nest(Mat A, Vec x, Vec y, Vec z) 3310998551bSBlanca Mellado Pinto { 3320998551bSBlanca Mellado Pinto PetscFunctionBegin; 3330998551bSBlanca Mellado Pinto PetscCall(MatMultTransposeAddKernel_Nest(A, x, y, z, PETSC_TRUE)); 3340998551bSBlanca Mellado Pinto PetscFunctionReturn(PETSC_SUCCESS); 3350998551bSBlanca Mellado Pinto } 3360998551bSBlanca Mellado Pinto 337d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatTranspose_Nest(Mat A, MatReuse reuse, Mat *B) 338d71ae5a4SJacob Faibussowitsch { 339f8170845SAlex Fikl Mat_Nest *bA = (Mat_Nest *)A->data, *bC; 340f8170845SAlex Fikl Mat C; 341f8170845SAlex Fikl PetscInt i, j, nr = bA->nr, nc = bA->nc; 342f8170845SAlex Fikl 343f8170845SAlex Fikl PetscFunctionBegin; 3447fb60732SBarry Smith if (reuse == MAT_REUSE_MATRIX) PetscCall(MatTransposeCheckNonzeroState_Private(A, *B)); 345aed4548fSBarry Smith PetscCheck(reuse != MAT_INPLACE_MATRIX || nr == nc, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_SIZ, "Square nested matrix only for in-place"); 346f8170845SAlex Fikl 347cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_INPLACE_MATRIX) { 348f8170845SAlex Fikl Mat *subs; 349f8170845SAlex Fikl IS *is_row, *is_col; 350f8170845SAlex Fikl 3519566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nr * nc, &subs)); 3529566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nr, &is_row, nc, &is_col)); 3539566063dSJacob Faibussowitsch PetscCall(MatNestGetISs(A, is_row, is_col)); 354cf37664fSBarry Smith if (reuse == MAT_INPLACE_MATRIX) { 355ddeb9bd8SAlex Fikl for (i = 0; i < nr; i++) { 356ad540459SPierre Jolivet for (j = 0; j < nc; j++) subs[i + nr * j] = bA->m[i][j]; 357ddeb9bd8SAlex Fikl } 358ddeb9bd8SAlex Fikl } 359ddeb9bd8SAlex Fikl 3609566063dSJacob Faibussowitsch PetscCall(MatCreateNest(PetscObjectComm((PetscObject)A), nc, is_col, nr, is_row, subs, &C)); 3619566063dSJacob Faibussowitsch PetscCall(PetscFree(subs)); 3629566063dSJacob Faibussowitsch PetscCall(PetscFree2(is_row, is_col)); 363f8170845SAlex Fikl } else { 364f8170845SAlex Fikl C = *B; 365f8170845SAlex Fikl } 366f8170845SAlex Fikl 367f8170845SAlex Fikl bC = (Mat_Nest *)C->data; 368f8170845SAlex Fikl for (i = 0; i < nr; i++) { 369f8170845SAlex Fikl for (j = 0; j < nc; j++) { 370f8170845SAlex Fikl if (bA->m[i][j]) { 371*f4f49eeaSPierre Jolivet PetscCall(MatTranspose(bA->m[i][j], reuse, &bC->m[j][i])); 372f8170845SAlex Fikl } else { 373f8170845SAlex Fikl bC->m[j][i] = NULL; 374f8170845SAlex Fikl } 375f8170845SAlex Fikl } 376f8170845SAlex Fikl } 377f8170845SAlex Fikl 378cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) { 379f8170845SAlex Fikl *B = C; 380f8170845SAlex Fikl } else { 3819566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(A, &C)); 382f8170845SAlex Fikl } 3833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 384f8170845SAlex Fikl } 385f8170845SAlex Fikl 386d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestDestroyISList(PetscInt n, IS **list) 387d71ae5a4SJacob Faibussowitsch { 388e2d7f03fSJed Brown IS *lst = *list; 389e2d7f03fSJed Brown PetscInt i; 390e2d7f03fSJed Brown 391e2d7f03fSJed Brown PetscFunctionBegin; 3923ba16761SJacob Faibussowitsch if (!lst) PetscFunctionReturn(PETSC_SUCCESS); 3939371c9d4SSatish Balay for (i = 0; i < n; i++) 3949371c9d4SSatish Balay if (lst[i]) PetscCall(ISDestroy(&lst[i])); 3959566063dSJacob Faibussowitsch PetscCall(PetscFree(lst)); 3960298fd71SBarry Smith *list = NULL; 3973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 398e2d7f03fSJed Brown } 399e2d7f03fSJed Brown 400d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatReset_Nest(Mat A) 401d71ae5a4SJacob Faibussowitsch { 402d8588912SDave May Mat_Nest *vs = (Mat_Nest *)A->data; 403d8588912SDave May PetscInt i, j; 404d8588912SDave May 405d8588912SDave May PetscFunctionBegin; 406d8588912SDave May /* release the matrices and the place holders */ 4079566063dSJacob Faibussowitsch PetscCall(MatNestDestroyISList(vs->nr, &vs->isglobal.row)); 4089566063dSJacob Faibussowitsch PetscCall(MatNestDestroyISList(vs->nc, &vs->isglobal.col)); 4099566063dSJacob Faibussowitsch PetscCall(MatNestDestroyISList(vs->nr, &vs->islocal.row)); 4109566063dSJacob Faibussowitsch PetscCall(MatNestDestroyISList(vs->nc, &vs->islocal.col)); 411d8588912SDave May 4129566063dSJacob Faibussowitsch PetscCall(PetscFree(vs->row_len)); 4139566063dSJacob Faibussowitsch PetscCall(PetscFree(vs->col_len)); 4149566063dSJacob Faibussowitsch PetscCall(PetscFree(vs->nnzstate)); 415d8588912SDave May 4169566063dSJacob Faibussowitsch PetscCall(PetscFree2(vs->left, vs->right)); 417207556f9SJed Brown 418d8588912SDave May /* release the matrices and the place holders */ 419d8588912SDave May if (vs->m) { 420d8588912SDave May for (i = 0; i < vs->nr; i++) { 42148a46eb9SPierre Jolivet for (j = 0; j < vs->nc; j++) PetscCall(MatDestroy(&vs->m[i][j])); 422d8588912SDave May } 4238068ee9dSPierre Jolivet PetscCall(PetscFree(vs->m[0])); 4249566063dSJacob Faibussowitsch PetscCall(PetscFree(vs->m)); 425d8588912SDave May } 42606a1af2fSStefano Zampini 42706a1af2fSStefano Zampini /* restore defaults */ 42806a1af2fSStefano Zampini vs->nr = 0; 42906a1af2fSStefano Zampini vs->nc = 0; 43006a1af2fSStefano Zampini vs->splitassembly = PETSC_FALSE; 4313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 43206a1af2fSStefano Zampini } 43306a1af2fSStefano Zampini 434d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDestroy_Nest(Mat A) 435d71ae5a4SJacob Faibussowitsch { 436362febeeSStefano Zampini PetscFunctionBegin; 4379566063dSJacob Faibussowitsch PetscCall(MatReset_Nest(A)); 4389566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 4399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetSubMat_C", NULL)); 4409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestSetSubMat_C", NULL)); 4419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetSubMats_C", NULL)); 4429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetSize_C", NULL)); 4439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetISs_C", NULL)); 4449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetLocalISs_C", NULL)); 4459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestSetVecType_C", NULL)); 4469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestSetSubMats_C", NULL)); 4479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_mpiaij_C", NULL)); 4489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_seqaij_C", NULL)); 4499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_aij_C", NULL)); 4509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_is_C", NULL)); 4519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_mpidense_C", NULL)); 4529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_seqdense_C", NULL)); 4539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_nest_seqdense_C", NULL)); 4549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_nest_mpidense_C", NULL)); 4553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 456d8588912SDave May } 457d8588912SDave May 458d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatMissingDiagonal_Nest(Mat mat, PetscBool *missing, PetscInt *dd) 459d71ae5a4SJacob Faibussowitsch { 460381b8e50SStefano Zampini Mat_Nest *vs = (Mat_Nest *)mat->data; 461381b8e50SStefano Zampini PetscInt i; 462381b8e50SStefano Zampini 463381b8e50SStefano Zampini PetscFunctionBegin; 464381b8e50SStefano Zampini if (dd) *dd = 0; 465381b8e50SStefano Zampini if (!vs->nr) { 466381b8e50SStefano Zampini *missing = PETSC_TRUE; 4673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 468381b8e50SStefano Zampini } 469381b8e50SStefano Zampini *missing = PETSC_FALSE; 470381b8e50SStefano Zampini for (i = 0; i < vs->nr && !(*missing); i++) { 471381b8e50SStefano Zampini *missing = PETSC_TRUE; 472381b8e50SStefano Zampini if (vs->m[i][i]) { 4739566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal(vs->m[i][i], missing, NULL)); 47408401ef6SPierre Jolivet PetscCheck(!*missing || !dd, PetscObjectComm((PetscObject)mat), PETSC_ERR_SUP, "First missing entry not yet implemented"); 475381b8e50SStefano Zampini } 476381b8e50SStefano Zampini } 4773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 478381b8e50SStefano Zampini } 479381b8e50SStefano Zampini 480d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyBegin_Nest(Mat A, MatAssemblyType type) 481d71ae5a4SJacob Faibussowitsch { 482d8588912SDave May Mat_Nest *vs = (Mat_Nest *)A->data; 483d8588912SDave May PetscInt i, j; 48406a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 485d8588912SDave May 486d8588912SDave May PetscFunctionBegin; 487d8588912SDave May for (i = 0; i < vs->nr; i++) { 488d8588912SDave May for (j = 0; j < vs->nc; j++) { 48906a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 490e7c19651SJed Brown if (vs->m[i][j]) { 4919566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(vs->m[i][j], type)); 492e7c19651SJed Brown if (!vs->splitassembly) { 493e7c19651SJed Brown /* Note: split assembly will fail if the same block appears more than once (even indirectly through a nested 494e7c19651SJed Brown * sub-block). This could be fixed by adding a flag to Mat so that there was a way to check if a Mat was 495e7c19651SJed Brown * already performing an assembly, but the result would by more complicated and appears to offer less 496e7c19651SJed Brown * potential for diagnostics and correctness checking. Split assembly should be fixed once there is an 497e7c19651SJed Brown * interface for libraries to make asynchronous progress in "user-defined non-blocking collectives". 498e7c19651SJed Brown */ 4999566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(vs->m[i][j], type)); 5009566063dSJacob Faibussowitsch PetscCall(MatGetNonzeroState(vs->m[i][j], &subnnzstate)); 501e7c19651SJed Brown } 502e7c19651SJed Brown } 50306a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || vs->nnzstate[i * vs->nc + j] != subnnzstate); 50406a1af2fSStefano Zampini vs->nnzstate[i * vs->nc + j] = subnnzstate; 505d8588912SDave May } 506d8588912SDave May } 50706a1af2fSStefano Zampini if (nnzstate) A->nonzerostate++; 5083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 509d8588912SDave May } 510d8588912SDave May 511d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAssemblyEnd_Nest(Mat A, MatAssemblyType type) 512d71ae5a4SJacob Faibussowitsch { 513d8588912SDave May Mat_Nest *vs = (Mat_Nest *)A->data; 514d8588912SDave May PetscInt i, j; 515d8588912SDave May 516d8588912SDave May PetscFunctionBegin; 517d8588912SDave May for (i = 0; i < vs->nr; i++) { 518d8588912SDave May for (j = 0; j < vs->nc; j++) { 519e7c19651SJed Brown if (vs->m[i][j]) { 52048a46eb9SPierre Jolivet if (vs->splitassembly) PetscCall(MatAssemblyEnd(vs->m[i][j], type)); 521e7c19651SJed Brown } 522d8588912SDave May } 523d8588912SDave May } 5243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 525d8588912SDave May } 526d8588912SDave May 527d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestFindNonzeroSubMatRow(Mat A, PetscInt row, Mat *B) 528d71ae5a4SJacob Faibussowitsch { 529f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 530f349c1fdSJed Brown PetscInt j; 531f349c1fdSJed Brown Mat sub; 532d8588912SDave May 533d8588912SDave May PetscFunctionBegin; 5340298fd71SBarry Smith sub = (row < vs->nc) ? vs->m[row][row] : (Mat)NULL; /* Prefer to find on the diagonal */ 535f349c1fdSJed Brown for (j = 0; !sub && j < vs->nc; j++) sub = vs->m[row][j]; 5369566063dSJacob Faibussowitsch if (sub) PetscCall(MatSetUp(sub)); /* Ensure that the sizes are available */ 537f349c1fdSJed Brown *B = sub; 5383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 539d8588912SDave May } 540d8588912SDave May 541d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestFindNonzeroSubMatCol(Mat A, PetscInt col, Mat *B) 542d71ae5a4SJacob Faibussowitsch { 543f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 544f349c1fdSJed Brown PetscInt i; 545f349c1fdSJed Brown Mat sub; 546f349c1fdSJed Brown 547f349c1fdSJed Brown PetscFunctionBegin; 5480298fd71SBarry Smith sub = (col < vs->nr) ? vs->m[col][col] : (Mat)NULL; /* Prefer to find on the diagonal */ 549f349c1fdSJed Brown for (i = 0; !sub && i < vs->nr; i++) sub = vs->m[i][col]; 5509566063dSJacob Faibussowitsch if (sub) PetscCall(MatSetUp(sub)); /* Ensure that the sizes are available */ 551f349c1fdSJed Brown *B = sub; 5523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 553d8588912SDave May } 554d8588912SDave May 555d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestFindISRange(Mat A, PetscInt n, const IS list[], IS is, PetscInt *begin, PetscInt *end) 556d71ae5a4SJacob Faibussowitsch { 55718d228c0SPierre Jolivet PetscInt i, j, size, m; 558f349c1fdSJed Brown PetscBool flg; 55918d228c0SPierre Jolivet IS out, concatenate[2]; 560f349c1fdSJed Brown 561f349c1fdSJed Brown PetscFunctionBegin; 5624f572ea9SToby Isaac PetscAssertPointer(list, 3); 563f349c1fdSJed Brown PetscValidHeaderSpecific(is, IS_CLASSID, 4); 56418d228c0SPierre Jolivet if (begin) { 5654f572ea9SToby Isaac PetscAssertPointer(begin, 5); 56618d228c0SPierre Jolivet *begin = -1; 56718d228c0SPierre Jolivet } 56818d228c0SPierre Jolivet if (end) { 5694f572ea9SToby Isaac PetscAssertPointer(end, 6); 57018d228c0SPierre Jolivet *end = -1; 57118d228c0SPierre Jolivet } 572f349c1fdSJed Brown for (i = 0; i < n; i++) { 573207556f9SJed Brown if (!list[i]) continue; 5749566063dSJacob Faibussowitsch PetscCall(ISEqualUnsorted(list[i], is, &flg)); 575f349c1fdSJed Brown if (flg) { 57618d228c0SPierre Jolivet if (begin) *begin = i; 57718d228c0SPierre Jolivet if (end) *end = i + 1; 5783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 579f349c1fdSJed Brown } 580f349c1fdSJed Brown } 5819566063dSJacob Faibussowitsch PetscCall(ISGetSize(is, &size)); 58218d228c0SPierre Jolivet for (i = 0; i < n - 1; i++) { 58318d228c0SPierre Jolivet if (!list[i]) continue; 58418d228c0SPierre Jolivet m = 0; 5859566063dSJacob Faibussowitsch PetscCall(ISConcatenate(PetscObjectComm((PetscObject)A), 2, list + i, &out)); 5869566063dSJacob Faibussowitsch PetscCall(ISGetSize(out, &m)); 58718d228c0SPierre Jolivet for (j = i + 2; j < n && m < size; j++) { 58818d228c0SPierre Jolivet if (list[j]) { 58918d228c0SPierre Jolivet concatenate[0] = out; 59018d228c0SPierre Jolivet concatenate[1] = list[j]; 5919566063dSJacob Faibussowitsch PetscCall(ISConcatenate(PetscObjectComm((PetscObject)A), 2, concatenate, &out)); 5929566063dSJacob Faibussowitsch PetscCall(ISDestroy(concatenate)); 5939566063dSJacob Faibussowitsch PetscCall(ISGetSize(out, &m)); 59418d228c0SPierre Jolivet } 59518d228c0SPierre Jolivet } 59618d228c0SPierre Jolivet if (m == size) { 5979566063dSJacob Faibussowitsch PetscCall(ISEqualUnsorted(out, is, &flg)); 59818d228c0SPierre Jolivet if (flg) { 59918d228c0SPierre Jolivet if (begin) *begin = i; 60018d228c0SPierre Jolivet if (end) *end = j; 6019566063dSJacob Faibussowitsch PetscCall(ISDestroy(&out)); 6023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 60318d228c0SPierre Jolivet } 60418d228c0SPierre Jolivet } 6059566063dSJacob Faibussowitsch PetscCall(ISDestroy(&out)); 60618d228c0SPierre Jolivet } 6073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 608f349c1fdSJed Brown } 609f349c1fdSJed Brown 610d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestFillEmptyMat_Private(Mat A, PetscInt i, PetscInt j, Mat *B) 611d71ae5a4SJacob Faibussowitsch { 6128188e55aSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 61318d228c0SPierre Jolivet PetscInt lr, lc; 61418d228c0SPierre Jolivet 61518d228c0SPierre Jolivet PetscFunctionBegin; 6169566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 6179566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(vs->isglobal.row[i], &lr)); 6189566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(vs->isglobal.col[j], &lc)); 6199566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, lr, lc, PETSC_DECIDE, PETSC_DECIDE)); 6209566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATAIJ)); 6219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(*B, 0, NULL)); 6229566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(*B, 0, NULL, 0, NULL)); 6239566063dSJacob Faibussowitsch PetscCall(MatSetUp(*B)); 6249566063dSJacob Faibussowitsch PetscCall(MatSetOption(*B, MAT_NO_OFF_PROC_ENTRIES, PETSC_TRUE)); 6259566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 6269566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 6273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 62818d228c0SPierre Jolivet } 62918d228c0SPierre Jolivet 630d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestGetBlock_Private(Mat A, PetscInt rbegin, PetscInt rend, PetscInt cbegin, PetscInt cend, Mat *B) 631d71ae5a4SJacob Faibussowitsch { 63218d228c0SPierre Jolivet Mat_Nest *vs = (Mat_Nest *)A->data; 63318d228c0SPierre Jolivet Mat *a; 63418d228c0SPierre Jolivet PetscInt i, j, k, l, nr = rend - rbegin, nc = cend - cbegin; 6358188e55aSJed Brown char keyname[256]; 63618d228c0SPierre Jolivet PetscBool *b; 63718d228c0SPierre Jolivet PetscBool flg; 6388188e55aSJed Brown 6398188e55aSJed Brown PetscFunctionBegin; 6400298fd71SBarry Smith *B = NULL; 6419566063dSJacob Faibussowitsch PetscCall(PetscSNPrintf(keyname, sizeof(keyname), "NestBlock_%" PetscInt_FMT "-%" PetscInt_FMT "x%" PetscInt_FMT "-%" PetscInt_FMT, rbegin, rend, cbegin, cend)); 6429566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, keyname, (PetscObject *)B)); 6433ba16761SJacob Faibussowitsch if (*B) PetscFunctionReturn(PETSC_SUCCESS); 6448188e55aSJed Brown 6459566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nr * nc, &a, nr * nc, &b)); 64618d228c0SPierre Jolivet for (i = 0; i < nr; i++) { 64718d228c0SPierre Jolivet for (j = 0; j < nc; j++) { 64818d228c0SPierre Jolivet a[i * nc + j] = vs->m[rbegin + i][cbegin + j]; 64918d228c0SPierre Jolivet b[i * nc + j] = PETSC_FALSE; 65018d228c0SPierre Jolivet } 65118d228c0SPierre Jolivet } 65218d228c0SPierre Jolivet if (nc != vs->nc && nr != vs->nr) { 65318d228c0SPierre Jolivet for (i = 0; i < nr; i++) { 65418d228c0SPierre Jolivet for (j = 0; j < nc; j++) { 65518d228c0SPierre Jolivet flg = PETSC_FALSE; 65618d228c0SPierre Jolivet for (k = 0; (k < nr && !flg); k++) { 65718d228c0SPierre Jolivet if (a[j + k * nc]) flg = PETSC_TRUE; 65818d228c0SPierre Jolivet } 65918d228c0SPierre Jolivet if (flg) { 66018d228c0SPierre Jolivet flg = PETSC_FALSE; 66118d228c0SPierre Jolivet for (l = 0; (l < nc && !flg); l++) { 66218d228c0SPierre Jolivet if (a[i * nc + l]) flg = PETSC_TRUE; 66318d228c0SPierre Jolivet } 66418d228c0SPierre Jolivet } 66518d228c0SPierre Jolivet if (!flg) { 66618d228c0SPierre Jolivet b[i * nc + j] = PETSC_TRUE; 6679566063dSJacob Faibussowitsch PetscCall(MatNestFillEmptyMat_Private(A, rbegin + i, cbegin + j, a + i * nc + j)); 66818d228c0SPierre Jolivet } 66918d228c0SPierre Jolivet } 67018d228c0SPierre Jolivet } 67118d228c0SPierre Jolivet } 6729566063dSJacob Faibussowitsch PetscCall(MatCreateNest(PetscObjectComm((PetscObject)A), nr, nr != vs->nr ? NULL : vs->isglobal.row, nc, nc != vs->nc ? NULL : vs->isglobal.col, a, B)); 67318d228c0SPierre Jolivet for (i = 0; i < nr; i++) { 67418d228c0SPierre Jolivet for (j = 0; j < nc; j++) { 67548a46eb9SPierre Jolivet if (b[i * nc + j]) PetscCall(MatDestroy(a + i * nc + j)); 67618d228c0SPierre Jolivet } 67718d228c0SPierre Jolivet } 6789566063dSJacob Faibussowitsch PetscCall(PetscFree2(a, b)); 6798188e55aSJed Brown (*B)->assembled = A->assembled; 6809566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, keyname, (PetscObject)*B)); 6819566063dSJacob Faibussowitsch PetscCall(PetscObjectDereference((PetscObject)*B)); /* Leave the only remaining reference in the composition */ 6823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6838188e55aSJed Brown } 6848188e55aSJed Brown 685d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestFindSubMat(Mat A, struct MatNestISPair *is, IS isrow, IS iscol, Mat *B) 686d71ae5a4SJacob Faibussowitsch { 687f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 68818d228c0SPierre Jolivet PetscInt rbegin, rend, cbegin, cend; 689f349c1fdSJed Brown 690f349c1fdSJed Brown PetscFunctionBegin; 6919566063dSJacob Faibussowitsch PetscCall(MatNestFindISRange(A, vs->nr, is->row, isrow, &rbegin, &rend)); 6929566063dSJacob Faibussowitsch PetscCall(MatNestFindISRange(A, vs->nc, is->col, iscol, &cbegin, &cend)); 69318d228c0SPierre Jolivet if (rend == rbegin + 1 && cend == cbegin + 1) { 69448a46eb9SPierre Jolivet if (!vs->m[rbegin][cbegin]) PetscCall(MatNestFillEmptyMat_Private(A, rbegin, cbegin, vs->m[rbegin] + cbegin)); 69518d228c0SPierre Jolivet *B = vs->m[rbegin][cbegin]; 69618d228c0SPierre Jolivet } else if (rbegin != -1 && cbegin != -1) { 6979566063dSJacob Faibussowitsch PetscCall(MatNestGetBlock_Private(A, rbegin, rend, cbegin, cend, B)); 69818d228c0SPierre Jolivet } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_INCOMP, "Could not find index set"); 6993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 700f349c1fdSJed Brown } 701f349c1fdSJed Brown 70206a1af2fSStefano Zampini /* 70306a1af2fSStefano Zampini TODO: This does not actually returns a submatrix we can modify 70406a1af2fSStefano Zampini */ 705d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrix_Nest(Mat A, IS isrow, IS iscol, MatReuse reuse, Mat *B) 706d71ae5a4SJacob Faibussowitsch { 707f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 708f349c1fdSJed Brown Mat sub; 709f349c1fdSJed Brown 710f349c1fdSJed Brown PetscFunctionBegin; 7119566063dSJacob Faibussowitsch PetscCall(MatNestFindSubMat(A, &vs->isglobal, isrow, iscol, &sub)); 712f349c1fdSJed Brown switch (reuse) { 713f349c1fdSJed Brown case MAT_INITIAL_MATRIX: 7149566063dSJacob Faibussowitsch if (sub) PetscCall(PetscObjectReference((PetscObject)sub)); 715f349c1fdSJed Brown *B = sub; 716f349c1fdSJed Brown break; 717d71ae5a4SJacob Faibussowitsch case MAT_REUSE_MATRIX: 718d71ae5a4SJacob Faibussowitsch PetscCheck(sub == *B, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Submatrix was not used before in this call"); 719d71ae5a4SJacob Faibussowitsch break; 720d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_MATRIX: /* Nothing to do */ 721d71ae5a4SJacob Faibussowitsch break; 722d71ae5a4SJacob Faibussowitsch case MAT_INPLACE_MATRIX: /* Nothing to do */ 723d71ae5a4SJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "MAT_INPLACE_MATRIX is not supported yet"); 724f349c1fdSJed Brown } 7253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 726f349c1fdSJed Brown } 727f349c1fdSJed Brown 72866976f2fSJacob Faibussowitsch static PetscErrorCode MatGetLocalSubMatrix_Nest(Mat A, IS isrow, IS iscol, Mat *B) 729d71ae5a4SJacob Faibussowitsch { 730f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 731f349c1fdSJed Brown Mat sub; 732f349c1fdSJed Brown 733f349c1fdSJed Brown PetscFunctionBegin; 7349566063dSJacob Faibussowitsch PetscCall(MatNestFindSubMat(A, &vs->islocal, isrow, iscol, &sub)); 735f349c1fdSJed Brown /* We allow the submatrix to be NULL, perhaps it would be better for the user to return an empty matrix instead */ 7369566063dSJacob Faibussowitsch if (sub) PetscCall(PetscObjectReference((PetscObject)sub)); 737f349c1fdSJed Brown *B = sub; 7383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 739d8588912SDave May } 740d8588912SDave May 741d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreLocalSubMatrix_Nest(Mat A, IS isrow, IS iscol, Mat *B) 742d71ae5a4SJacob Faibussowitsch { 743f349c1fdSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 744f349c1fdSJed Brown Mat sub; 745d8588912SDave May 746d8588912SDave May PetscFunctionBegin; 7479566063dSJacob Faibussowitsch PetscCall(MatNestFindSubMat(A, &vs->islocal, isrow, iscol, &sub)); 74808401ef6SPierre Jolivet PetscCheck(*B == sub, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Local submatrix has not been gotten"); 749f349c1fdSJed Brown if (sub) { 750aed4548fSBarry Smith PetscCheck(((PetscObject)sub)->refct > 1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Local submatrix has had reference count decremented too many times"); 7519566063dSJacob Faibussowitsch PetscCall(MatDestroy(B)); 752d8588912SDave May } 7533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 754d8588912SDave May } 755d8588912SDave May 756d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_Nest(Mat A, Vec v) 757d71ae5a4SJacob Faibussowitsch { 7587874fa86SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 7597874fa86SDave May PetscInt i; 7607874fa86SDave May 7617874fa86SDave May PetscFunctionBegin; 7627874fa86SDave May for (i = 0; i < bA->nr; i++) { 763429bac76SJed Brown Vec bv; 7649566063dSJacob Faibussowitsch PetscCall(VecGetSubVector(v, bA->isglobal.row[i], &bv)); 7657874fa86SDave May if (bA->m[i][i]) { 7669566063dSJacob Faibussowitsch PetscCall(MatGetDiagonal(bA->m[i][i], bv)); 7677874fa86SDave May } else { 7689566063dSJacob Faibussowitsch PetscCall(VecSet(bv, 0.0)); 7697874fa86SDave May } 7709566063dSJacob Faibussowitsch PetscCall(VecRestoreSubVector(v, bA->isglobal.row[i], &bv)); 7717874fa86SDave May } 7723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7737874fa86SDave May } 7747874fa86SDave May 775d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDiagonalScale_Nest(Mat A, Vec l, Vec r) 776d71ae5a4SJacob Faibussowitsch { 7777874fa86SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 778429bac76SJed Brown Vec bl, *br; 7797874fa86SDave May PetscInt i, j; 7807874fa86SDave May 7817874fa86SDave May PetscFunctionBegin; 7829566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(bA->nc, &br)); 7832e6472ebSElliott Sales de Andrade if (r) { 7849566063dSJacob Faibussowitsch for (j = 0; j < bA->nc; j++) PetscCall(VecGetSubVector(r, bA->isglobal.col[j], &br[j])); 7852e6472ebSElliott Sales de Andrade } 7862e6472ebSElliott Sales de Andrade bl = NULL; 7877874fa86SDave May for (i = 0; i < bA->nr; i++) { 78848a46eb9SPierre Jolivet if (l) PetscCall(VecGetSubVector(l, bA->isglobal.row[i], &bl)); 7897874fa86SDave May for (j = 0; j < bA->nc; j++) { 79048a46eb9SPierre Jolivet if (bA->m[i][j]) PetscCall(MatDiagonalScale(bA->m[i][j], bl, br[j])); 7917874fa86SDave May } 79248a46eb9SPierre Jolivet if (l) PetscCall(VecRestoreSubVector(l, bA->isglobal.row[i], &bl)); 7932e6472ebSElliott Sales de Andrade } 7942e6472ebSElliott Sales de Andrade if (r) { 7959566063dSJacob Faibussowitsch for (j = 0; j < bA->nc; j++) PetscCall(VecRestoreSubVector(r, bA->isglobal.col[j], &br[j])); 7962e6472ebSElliott Sales de Andrade } 7979566063dSJacob Faibussowitsch PetscCall(PetscFree(br)); 7983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7997874fa86SDave May } 8007874fa86SDave May 801d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatScale_Nest(Mat A, PetscScalar a) 802d71ae5a4SJacob Faibussowitsch { 803a061e289SJed Brown Mat_Nest *bA = (Mat_Nest *)A->data; 804a061e289SJed Brown PetscInt i, j; 805a061e289SJed Brown 806a061e289SJed Brown PetscFunctionBegin; 807a061e289SJed Brown for (i = 0; i < bA->nr; i++) { 808a061e289SJed Brown for (j = 0; j < bA->nc; j++) { 80948a46eb9SPierre Jolivet if (bA->m[i][j]) PetscCall(MatScale(bA->m[i][j], a)); 810a061e289SJed Brown } 811a061e289SJed Brown } 8123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a061e289SJed Brown } 814a061e289SJed Brown 815d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatShift_Nest(Mat A, PetscScalar a) 816d71ae5a4SJacob Faibussowitsch { 817a061e289SJed Brown Mat_Nest *bA = (Mat_Nest *)A->data; 818a061e289SJed Brown PetscInt i; 81906a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 820a061e289SJed Brown 821a061e289SJed Brown PetscFunctionBegin; 822a061e289SJed Brown for (i = 0; i < bA->nr; i++) { 82306a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 82408401ef6SPierre Jolivet PetscCheck(bA->m[i][i], PetscObjectComm((PetscObject)A), PETSC_ERR_SUP, "No support for shifting an empty diagonal block, insert a matrix in block (%" PetscInt_FMT ",%" PetscInt_FMT ")", i, i); 8259566063dSJacob Faibussowitsch PetscCall(MatShift(bA->m[i][i], a)); 8269566063dSJacob Faibussowitsch PetscCall(MatGetNonzeroState(bA->m[i][i], &subnnzstate)); 82706a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i * bA->nc + i] != subnnzstate); 82806a1af2fSStefano Zampini bA->nnzstate[i * bA->nc + i] = subnnzstate; 829a061e289SJed Brown } 83006a1af2fSStefano Zampini if (nnzstate) A->nonzerostate++; 8313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 832a061e289SJed Brown } 833a061e289SJed Brown 834d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDiagonalSet_Nest(Mat A, Vec D, InsertMode is) 835d71ae5a4SJacob Faibussowitsch { 83613135bc6SAlex Fikl Mat_Nest *bA = (Mat_Nest *)A->data; 83713135bc6SAlex Fikl PetscInt i; 83806a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 83913135bc6SAlex Fikl 84013135bc6SAlex Fikl PetscFunctionBegin; 84113135bc6SAlex Fikl for (i = 0; i < bA->nr; i++) { 84206a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 84313135bc6SAlex Fikl Vec bv; 8449566063dSJacob Faibussowitsch PetscCall(VecGetSubVector(D, bA->isglobal.row[i], &bv)); 84513135bc6SAlex Fikl if (bA->m[i][i]) { 8469566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet(bA->m[i][i], bv, is)); 8479566063dSJacob Faibussowitsch PetscCall(MatGetNonzeroState(bA->m[i][i], &subnnzstate)); 84813135bc6SAlex Fikl } 8499566063dSJacob Faibussowitsch PetscCall(VecRestoreSubVector(D, bA->isglobal.row[i], &bv)); 85006a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || bA->nnzstate[i * bA->nc + i] != subnnzstate); 85106a1af2fSStefano Zampini bA->nnzstate[i * bA->nc + i] = subnnzstate; 85213135bc6SAlex Fikl } 85306a1af2fSStefano Zampini if (nnzstate) A->nonzerostate++; 8543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 85513135bc6SAlex Fikl } 85613135bc6SAlex Fikl 857d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_Nest(Mat A, PetscRandom rctx) 858d71ae5a4SJacob Faibussowitsch { 859f8170845SAlex Fikl Mat_Nest *bA = (Mat_Nest *)A->data; 860f8170845SAlex Fikl PetscInt i, j; 861f8170845SAlex Fikl 862f8170845SAlex Fikl PetscFunctionBegin; 863f8170845SAlex Fikl for (i = 0; i < bA->nr; i++) { 864f8170845SAlex Fikl for (j = 0; j < bA->nc; j++) { 86548a46eb9SPierre Jolivet if (bA->m[i][j]) PetscCall(MatSetRandom(bA->m[i][j], rctx)); 866f8170845SAlex Fikl } 867f8170845SAlex Fikl } 8683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 869f8170845SAlex Fikl } 870f8170845SAlex Fikl 871d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatCreateVecs_Nest(Mat A, Vec *right, Vec *left) 872d71ae5a4SJacob Faibussowitsch { 873d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 874d8588912SDave May Vec *L, *R; 875d8588912SDave May MPI_Comm comm; 876d8588912SDave May PetscInt i, j; 877d8588912SDave May 878d8588912SDave May PetscFunctionBegin; 8799566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)A, &comm)); 880d8588912SDave May if (right) { 881d8588912SDave May /* allocate R */ 8829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bA->nc, &R)); 883d8588912SDave May /* Create the right vectors */ 884d8588912SDave May for (j = 0; j < bA->nc; j++) { 885d8588912SDave May for (i = 0; i < bA->nr; i++) { 886d8588912SDave May if (bA->m[i][j]) { 8879566063dSJacob Faibussowitsch PetscCall(MatCreateVecs(bA->m[i][j], &R[j], NULL)); 888d8588912SDave May break; 889d8588912SDave May } 890d8588912SDave May } 89108401ef6SPierre Jolivet PetscCheck(i != bA->nr, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null column."); 892d8588912SDave May } 8939566063dSJacob Faibussowitsch PetscCall(VecCreateNest(comm, bA->nc, bA->isglobal.col, R, right)); 894d8588912SDave May /* hand back control to the nest vector */ 89548a46eb9SPierre Jolivet for (j = 0; j < bA->nc; j++) PetscCall(VecDestroy(&R[j])); 8969566063dSJacob Faibussowitsch PetscCall(PetscFree(R)); 897d8588912SDave May } 898d8588912SDave May 899d8588912SDave May if (left) { 900d8588912SDave May /* allocate L */ 9019566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bA->nr, &L)); 902d8588912SDave May /* Create the left vectors */ 903d8588912SDave May for (i = 0; i < bA->nr; i++) { 904d8588912SDave May for (j = 0; j < bA->nc; j++) { 905d8588912SDave May if (bA->m[i][j]) { 9069566063dSJacob Faibussowitsch PetscCall(MatCreateVecs(bA->m[i][j], NULL, &L[i])); 907d8588912SDave May break; 908d8588912SDave May } 909d8588912SDave May } 91008401ef6SPierre Jolivet PetscCheck(j != bA->nc, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Mat(Nest) contains a null row."); 911d8588912SDave May } 912d8588912SDave May 9139566063dSJacob Faibussowitsch PetscCall(VecCreateNest(comm, bA->nr, bA->isglobal.row, L, left)); 91448a46eb9SPierre Jolivet for (i = 0; i < bA->nr; i++) PetscCall(VecDestroy(&L[i])); 915d8588912SDave May 9169566063dSJacob Faibussowitsch PetscCall(PetscFree(L)); 917d8588912SDave May } 9183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 919d8588912SDave May } 920d8588912SDave May 921d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_Nest(Mat A, PetscViewer viewer) 922d71ae5a4SJacob Faibussowitsch { 923d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 92429e60adbSStefano Zampini PetscBool isascii, viewSub = PETSC_FALSE; 925d8588912SDave May PetscInt i, j; 926d8588912SDave May 927d8588912SDave May PetscFunctionBegin; 9289566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &isascii)); 929d8588912SDave May if (isascii) { 9309566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)A)->options, ((PetscObject)A)->prefix, "-mat_view_nest_sub", &viewSub, NULL)); 9319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "Matrix object:\n")); 9329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPushTab(viewer)); 9339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "type=nest, rows=%" PetscInt_FMT ", cols=%" PetscInt_FMT "\n", bA->nr, bA->nc)); 934d8588912SDave May 9359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "MatNest structure:\n")); 936d8588912SDave May for (i = 0; i < bA->nr; i++) { 937d8588912SDave May for (j = 0; j < bA->nc; j++) { 93819fd82e9SBarry Smith MatType type; 939270f95d7SJed Brown char name[256] = "", prefix[256] = ""; 940d8588912SDave May PetscInt NR, NC; 941d8588912SDave May PetscBool isNest = PETSC_FALSE; 942d8588912SDave May 943d8588912SDave May if (!bA->m[i][j]) { 9449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "(%" PetscInt_FMT ",%" PetscInt_FMT ") : NULL\n", i, j)); 945d8588912SDave May continue; 946d8588912SDave May } 9479566063dSJacob Faibussowitsch PetscCall(MatGetSize(bA->m[i][j], &NR, &NC)); 9489566063dSJacob Faibussowitsch PetscCall(MatGetType(bA->m[i][j], &type)); 9499566063dSJacob Faibussowitsch if (((PetscObject)bA->m[i][j])->name) PetscCall(PetscSNPrintf(name, sizeof(name), "name=\"%s\", ", ((PetscObject)bA->m[i][j])->name)); 9509566063dSJacob Faibussowitsch if (((PetscObject)bA->m[i][j])->prefix) PetscCall(PetscSNPrintf(prefix, sizeof(prefix), "prefix=\"%s\", ", ((PetscObject)bA->m[i][j])->prefix)); 9519566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)bA->m[i][j], MATNEST, &isNest)); 952d8588912SDave May 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "(%" PetscInt_FMT ",%" PetscInt_FMT ") : %s%stype=%s, rows=%" PetscInt_FMT ", cols=%" PetscInt_FMT "\n", i, j, name, prefix, type, NR, NC)); 954d8588912SDave May 95529e60adbSStefano Zampini if (isNest || viewSub) { 9569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPushTab(viewer)); /* push1 */ 9579566063dSJacob Faibussowitsch PetscCall(MatView(bA->m[i][j], viewer)); 9589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPopTab(viewer)); /* pop1 */ 959d8588912SDave May } 960d8588912SDave May } 961d8588912SDave May } 9629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPopTab(viewer)); /* pop0 */ 963d8588912SDave May } 9643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 965d8588912SDave May } 966d8588912SDave May 967d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatZeroEntries_Nest(Mat A) 968d71ae5a4SJacob Faibussowitsch { 969d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 970d8588912SDave May PetscInt i, j; 971d8588912SDave May 972d8588912SDave May PetscFunctionBegin; 973d8588912SDave May for (i = 0; i < bA->nr; i++) { 974d8588912SDave May for (j = 0; j < bA->nc; j++) { 975d8588912SDave May if (!bA->m[i][j]) continue; 9769566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(bA->m[i][j])); 977d8588912SDave May } 978d8588912SDave May } 9793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 980d8588912SDave May } 981d8588912SDave May 982d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatCopy_Nest(Mat A, Mat B, MatStructure str) 983d71ae5a4SJacob Faibussowitsch { 984c222c20dSDavid Ham Mat_Nest *bA = (Mat_Nest *)A->data, *bB = (Mat_Nest *)B->data; 985c222c20dSDavid Ham PetscInt i, j, nr = bA->nr, nc = bA->nc; 98606a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 987c222c20dSDavid Ham 988c222c20dSDavid Ham PetscFunctionBegin; 989aed4548fSBarry Smith PetscCheck(nr == bB->nr && nc == bB->nc, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_INCOMP, "Cannot copy a Mat_Nest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ") to a Mat_Nest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ")", bB->nr, bB->nc, nr, nc); 990c222c20dSDavid Ham for (i = 0; i < nr; i++) { 991c222c20dSDavid Ham for (j = 0; j < nc; j++) { 99206a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 99346a2b97cSJed Brown if (bA->m[i][j] && bB->m[i][j]) { 9949566063dSJacob Faibussowitsch PetscCall(MatCopy(bA->m[i][j], bB->m[i][j], str)); 99508401ef6SPierre Jolivet } else PetscCheck(!bA->m[i][j] && !bB->m[i][j], PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_INCOMP, "Matrix block does not exist at %" PetscInt_FMT ",%" PetscInt_FMT, i, j); 9969566063dSJacob Faibussowitsch PetscCall(MatGetNonzeroState(bB->m[i][j], &subnnzstate)); 99706a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || bB->nnzstate[i * nc + j] != subnnzstate); 99806a1af2fSStefano Zampini bB->nnzstate[i * nc + j] = subnnzstate; 999c222c20dSDavid Ham } 1000c222c20dSDavid Ham } 100106a1af2fSStefano Zampini if (nnzstate) B->nonzerostate++; 10023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1003c222c20dSDavid Ham } 1004c222c20dSDavid Ham 1005d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatAXPY_Nest(Mat Y, PetscScalar a, Mat X, MatStructure str) 1006d71ae5a4SJacob Faibussowitsch { 10076e76ffeaSPierre Jolivet Mat_Nest *bY = (Mat_Nest *)Y->data, *bX = (Mat_Nest *)X->data; 10086e76ffeaSPierre Jolivet PetscInt i, j, nr = bY->nr, nc = bY->nc; 100906a1af2fSStefano Zampini PetscBool nnzstate = PETSC_FALSE; 10106e76ffeaSPierre Jolivet 10116e76ffeaSPierre Jolivet PetscFunctionBegin; 1012aed4548fSBarry Smith PetscCheck(nr == bX->nr && nc == bX->nc, PetscObjectComm((PetscObject)Y), PETSC_ERR_ARG_INCOMP, "Cannot AXPY a MatNest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ") with a MatNest of block size (%" PetscInt_FMT ",%" PetscInt_FMT ")", bX->nr, bX->nc, nr, nc); 10136e76ffeaSPierre Jolivet for (i = 0; i < nr; i++) { 10146e76ffeaSPierre Jolivet for (j = 0; j < nc; j++) { 101506a1af2fSStefano Zampini PetscObjectState subnnzstate = 0; 10166e76ffeaSPierre Jolivet if (bY->m[i][j] && bX->m[i][j]) { 10179566063dSJacob Faibussowitsch PetscCall(MatAXPY(bY->m[i][j], a, bX->m[i][j], str)); 1018c066aebcSStefano Zampini } else if (bX->m[i][j]) { 1019c066aebcSStefano Zampini Mat M; 1020c066aebcSStefano Zampini 1021e75569e9SPierre Jolivet PetscCheck(str == DIFFERENT_NONZERO_PATTERN || str == UNKNOWN_NONZERO_PATTERN, PetscObjectComm((PetscObject)Y), PETSC_ERR_ARG_INCOMP, "Matrix block does not exist at %" PetscInt_FMT ",%" PetscInt_FMT ". Use DIFFERENT_NONZERO_PATTERN or UNKNOWN_NONZERO_PATTERN", i, j); 10229566063dSJacob Faibussowitsch PetscCall(MatDuplicate(bX->m[i][j], MAT_COPY_VALUES, &M)); 10239566063dSJacob Faibussowitsch PetscCall(MatNestSetSubMat(Y, i, j, M)); 10249566063dSJacob Faibussowitsch PetscCall(MatDestroy(&M)); 1025c066aebcSStefano Zampini } 10269566063dSJacob Faibussowitsch if (bY->m[i][j]) PetscCall(MatGetNonzeroState(bY->m[i][j], &subnnzstate)); 102706a1af2fSStefano Zampini nnzstate = (PetscBool)(nnzstate || bY->nnzstate[i * nc + j] != subnnzstate); 102806a1af2fSStefano Zampini bY->nnzstate[i * nc + j] = subnnzstate; 10296e76ffeaSPierre Jolivet } 10306e76ffeaSPierre Jolivet } 103106a1af2fSStefano Zampini if (nnzstate) Y->nonzerostate++; 10323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10336e76ffeaSPierre Jolivet } 10346e76ffeaSPierre Jolivet 1035d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatDuplicate_Nest(Mat A, MatDuplicateOption op, Mat *B) 1036d71ae5a4SJacob Faibussowitsch { 1037d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 1038841e96a3SJed Brown Mat *b; 1039841e96a3SJed Brown PetscInt i, j, nr = bA->nr, nc = bA->nc; 1040d8588912SDave May 1041d8588912SDave May PetscFunctionBegin; 10429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nr * nc, &b)); 1043841e96a3SJed Brown for (i = 0; i < nr; i++) { 1044841e96a3SJed Brown for (j = 0; j < nc; j++) { 1045841e96a3SJed Brown if (bA->m[i][j]) { 10469566063dSJacob Faibussowitsch PetscCall(MatDuplicate(bA->m[i][j], op, &b[i * nc + j])); 1047841e96a3SJed Brown } else { 10480298fd71SBarry Smith b[i * nc + j] = NULL; 1049d8588912SDave May } 1050d8588912SDave May } 1051d8588912SDave May } 10529566063dSJacob Faibussowitsch PetscCall(MatCreateNest(PetscObjectComm((PetscObject)A), nr, bA->isglobal.row, nc, bA->isglobal.col, b, B)); 1053841e96a3SJed Brown /* Give the new MatNest exclusive ownership */ 105448a46eb9SPierre Jolivet for (i = 0; i < nr * nc; i++) PetscCall(MatDestroy(&b[i])); 10559566063dSJacob Faibussowitsch PetscCall(PetscFree(b)); 1056d8588912SDave May 10579566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 10589566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 10593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1060d8588912SDave May } 1061d8588912SDave May 1062d8588912SDave May /* nest api */ 106366976f2fSJacob Faibussowitsch static PetscErrorCode MatNestGetSubMat_Nest(Mat A, PetscInt idxm, PetscInt jdxm, Mat *mat) 1064d71ae5a4SJacob Faibussowitsch { 1065d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 10665fd66863SKarl Rupp 1067d8588912SDave May PetscFunctionBegin; 106808401ef6SPierre Jolivet PetscCheck(idxm < bA->nr, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, idxm, bA->nr - 1); 106908401ef6SPierre Jolivet PetscCheck(jdxm < bA->nc, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Col too large: row %" PetscInt_FMT " max %" PetscInt_FMT, jdxm, bA->nc - 1); 1070d8588912SDave May *mat = bA->m[idxm][jdxm]; 10713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1072d8588912SDave May } 1073d8588912SDave May 10749ba0d327SJed Brown /*@ 107511a5261eSBarry Smith MatNestGetSubMat - Returns a single, sub-matrix from a `MATNEST` 1076d8588912SDave May 10772ef1f0ffSBarry Smith Not Collective 1078d8588912SDave May 1079d8588912SDave May Input Parameters: 108011a5261eSBarry Smith + A - `MATNEST` matrix 1081d8588912SDave May . idxm - index of the matrix within the nest matrix 1082629881c0SJed Brown - jdxm - index of the matrix within the nest matrix 1083d8588912SDave May 1084d8588912SDave May Output Parameter: 10852ef1f0ffSBarry Smith . sub - matrix at index `idxm`, `jdxm` within the nest matrix 1086d8588912SDave May 1087d8588912SDave May Level: developer 1088d8588912SDave May 1089fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatNestGetSize()`, `MatNestGetSubMats()`, `MatCreateNest()`, `MatNestSetSubMat()`, 1090db781477SPatrick Sanan `MatNestGetLocalISs()`, `MatNestGetISs()` 1091d8588912SDave May @*/ 1092d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestGetSubMat(Mat A, PetscInt idxm, PetscInt jdxm, Mat *sub) 1093d71ae5a4SJacob Faibussowitsch { 1094d8588912SDave May PetscFunctionBegin; 1095cac4c232SBarry Smith PetscUseMethod(A, "MatNestGetSubMat_C", (Mat, PetscInt, PetscInt, Mat *), (A, idxm, jdxm, sub)); 10963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1097d8588912SDave May } 1098d8588912SDave May 109966976f2fSJacob Faibussowitsch static PetscErrorCode MatNestSetSubMat_Nest(Mat A, PetscInt idxm, PetscInt jdxm, Mat mat) 1100d71ae5a4SJacob Faibussowitsch { 11010782ca92SJed Brown Mat_Nest *bA = (Mat_Nest *)A->data; 11020782ca92SJed Brown PetscInt m, n, M, N, mi, ni, Mi, Ni; 11030782ca92SJed Brown 11040782ca92SJed Brown PetscFunctionBegin; 110508401ef6SPierre Jolivet PetscCheck(idxm < bA->nr, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, idxm, bA->nr - 1); 110608401ef6SPierre Jolivet PetscCheck(jdxm < bA->nc, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Col too large: row %" PetscInt_FMT " max %" PetscInt_FMT, jdxm, bA->nc - 1); 11079566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(mat, &m, &n)); 11089566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 11099566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(bA->isglobal.row[idxm], &mi)); 11109566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.row[idxm], &Mi)); 11119566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(bA->isglobal.col[jdxm], &ni)); 11129566063dSJacob Faibussowitsch PetscCall(ISGetSize(bA->isglobal.col[jdxm], &Ni)); 1113aed4548fSBarry Smith PetscCheck(M == Mi && N == Ni, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_INCOMP, "Submatrix dimension (%" PetscInt_FMT ",%" PetscInt_FMT ") incompatible with nest block (%" PetscInt_FMT ",%" PetscInt_FMT ")", M, N, Mi, Ni); 1114aed4548fSBarry Smith PetscCheck(m == mi && n == ni, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_INCOMP, "Submatrix local dimension (%" PetscInt_FMT ",%" PetscInt_FMT ") incompatible with nest block (%" PetscInt_FMT ",%" PetscInt_FMT ")", m, n, mi, ni); 111526fbe8dcSKarl Rupp 111606a1af2fSStefano Zampini /* do not increase object state */ 11173ba16761SJacob Faibussowitsch if (mat == bA->m[idxm][jdxm]) PetscFunctionReturn(PETSC_SUCCESS); 111806a1af2fSStefano Zampini 11199566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)mat)); 11209566063dSJacob Faibussowitsch PetscCall(MatDestroy(&bA->m[idxm][jdxm])); 11210782ca92SJed Brown bA->m[idxm][jdxm] = mat; 11229566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 11239566063dSJacob Faibussowitsch PetscCall(MatGetNonzeroState(mat, &bA->nnzstate[idxm * bA->nc + jdxm])); 112406a1af2fSStefano Zampini A->nonzerostate++; 11253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11260782ca92SJed Brown } 11270782ca92SJed Brown 11289ba0d327SJed Brown /*@ 112911a5261eSBarry Smith MatNestSetSubMat - Set a single submatrix in the `MATNEST` 11300782ca92SJed Brown 11312ef1f0ffSBarry Smith Logically Collective 11320782ca92SJed Brown 11330782ca92SJed Brown Input Parameters: 113411a5261eSBarry Smith + A - `MATNEST` matrix 11350782ca92SJed Brown . idxm - index of the matrix within the nest matrix 11360782ca92SJed Brown . jdxm - index of the matrix within the nest matrix 11372ef1f0ffSBarry Smith - sub - matrix at index `idxm`, `jdxm` within the nest matrix 11382ef1f0ffSBarry Smith 11392ef1f0ffSBarry Smith Level: developer 11400782ca92SJed Brown 11410782ca92SJed Brown Notes: 11420782ca92SJed Brown The new submatrix must have the same size and communicator as that block of the nest. 11430782ca92SJed Brown 11440782ca92SJed Brown This increments the reference count of the submatrix. 11450782ca92SJed Brown 1146fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatNestSetSubMats()`, `MatNestGetSubMats()`, `MatNestGetLocalISs()`, `MatCreateNest()`, 1147db781477SPatrick Sanan `MatNestGetSubMat()`, `MatNestGetISs()`, `MatNestGetSize()` 11480782ca92SJed Brown @*/ 1149d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestSetSubMat(Mat A, PetscInt idxm, PetscInt jdxm, Mat sub) 1150d71ae5a4SJacob Faibussowitsch { 11510782ca92SJed Brown PetscFunctionBegin; 1152cac4c232SBarry Smith PetscUseMethod(A, "MatNestSetSubMat_C", (Mat, PetscInt, PetscInt, Mat), (A, idxm, jdxm, sub)); 11533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11540782ca92SJed Brown } 11550782ca92SJed Brown 115666976f2fSJacob Faibussowitsch static PetscErrorCode MatNestGetSubMats_Nest(Mat A, PetscInt *M, PetscInt *N, Mat ***mat) 1157d71ae5a4SJacob Faibussowitsch { 1158d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 11595fd66863SKarl Rupp 1160d8588912SDave May PetscFunctionBegin; 116126fbe8dcSKarl Rupp if (M) *M = bA->nr; 116226fbe8dcSKarl Rupp if (N) *N = bA->nc; 116326fbe8dcSKarl Rupp if (mat) *mat = bA->m; 11643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1165d8588912SDave May } 1166d8588912SDave May 1167d8588912SDave May /*@C 116811a5261eSBarry Smith MatNestGetSubMats - Returns the entire two dimensional array of matrices defining a `MATNEST` matrix. 1169d8588912SDave May 11702ef1f0ffSBarry Smith Not Collective 1171d8588912SDave May 1172f899ff85SJose E. Roman Input Parameter: 1173629881c0SJed Brown . A - nest matrix 1174d8588912SDave May 1175d8d19677SJose E. Roman Output Parameters: 1176629881c0SJed Brown + M - number of rows in the nest matrix 1177d8588912SDave May . N - number of cols in the nest matrix 1178e9d3347aSJose E. Roman - mat - array of matrices 1179d8588912SDave May 11802ef1f0ffSBarry Smith Level: developer 11812ef1f0ffSBarry Smith 118211a5261eSBarry Smith Note: 11832ef1f0ffSBarry Smith The user should not free the array `mat`. 1184d8588912SDave May 1185fe59aa6dSJacob Faibussowitsch Fortran Notes: 118611a5261eSBarry Smith This routine has a calling sequence 1187351962e3SVincent Le Chenadec $ call MatNestGetSubMats(A, M, N, mat, ierr) 118820f4b53cSBarry Smith where the space allocated for the optional argument `mat` is assumed large enough (if provided). 1189e9d3347aSJose E. Roman Matrices in `mat` are returned in row-major order, see `MatCreateNest()` for an example. 1190351962e3SVincent Le Chenadec 1191fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatNestGetSize()`, `MatNestGetSubMat()`, `MatNestGetLocalISs()`, `MatCreateNest()`, 1192db781477SPatrick Sanan `MatNestSetSubMats()`, `MatNestGetISs()`, `MatNestSetSubMat()` 1193d8588912SDave May @*/ 1194d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestGetSubMats(Mat A, PetscInt *M, PetscInt *N, Mat ***mat) 1195d71ae5a4SJacob Faibussowitsch { 1196d8588912SDave May PetscFunctionBegin; 1197cac4c232SBarry Smith PetscUseMethod(A, "MatNestGetSubMats_C", (Mat, PetscInt *, PetscInt *, Mat ***), (A, M, N, mat)); 11983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1199d8588912SDave May } 1200d8588912SDave May 120166976f2fSJacob Faibussowitsch static PetscErrorCode MatNestGetSize_Nest(Mat A, PetscInt *M, PetscInt *N) 1202d71ae5a4SJacob Faibussowitsch { 1203d8588912SDave May Mat_Nest *bA = (Mat_Nest *)A->data; 1204d8588912SDave May 1205d8588912SDave May PetscFunctionBegin; 120626fbe8dcSKarl Rupp if (M) *M = bA->nr; 120726fbe8dcSKarl Rupp if (N) *N = bA->nc; 12083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1209d8588912SDave May } 1210d8588912SDave May 12119ba0d327SJed Brown /*@ 121211a5261eSBarry Smith MatNestGetSize - Returns the size of the `MATNEST` matrix. 1213d8588912SDave May 12142ef1f0ffSBarry Smith Not Collective 1215d8588912SDave May 1216f899ff85SJose E. Roman Input Parameter: 121711a5261eSBarry Smith . A - `MATNEST` matrix 1218d8588912SDave May 1219d8d19677SJose E. Roman Output Parameters: 1220629881c0SJed Brown + M - number of rows in the nested mat 1221629881c0SJed Brown - N - number of cols in the nested mat 1222d8588912SDave May 1223d8588912SDave May Level: developer 1224d8588912SDave May 1225fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatNestGetSubMat()`, `MatNestGetSubMats()`, `MatCreateNest()`, `MatNestGetLocalISs()`, 1226db781477SPatrick Sanan `MatNestGetISs()` 1227d8588912SDave May @*/ 1228d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestGetSize(Mat A, PetscInt *M, PetscInt *N) 1229d71ae5a4SJacob Faibussowitsch { 1230d8588912SDave May PetscFunctionBegin; 1231cac4c232SBarry Smith PetscUseMethod(A, "MatNestGetSize_C", (Mat, PetscInt *, PetscInt *), (A, M, N)); 12323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1233d8588912SDave May } 1234d8588912SDave May 1235d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestGetISs_Nest(Mat A, IS rows[], IS cols[]) 1236d71ae5a4SJacob Faibussowitsch { 1237900e7ff2SJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 1238900e7ff2SJed Brown PetscInt i; 1239900e7ff2SJed Brown 1240900e7ff2SJed Brown PetscFunctionBegin; 12419371c9d4SSatish Balay if (rows) 12429371c9d4SSatish Balay for (i = 0; i < vs->nr; i++) rows[i] = vs->isglobal.row[i]; 12439371c9d4SSatish Balay if (cols) 12449371c9d4SSatish Balay for (i = 0; i < vs->nc; i++) cols[i] = vs->isglobal.col[i]; 12453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1246900e7ff2SJed Brown } 1247900e7ff2SJed Brown 12483a4d7b9aSSatish Balay /*@C 124911a5261eSBarry Smith MatNestGetISs - Returns the index sets partitioning the row and column spaces of a `MATNEST` 1250900e7ff2SJed Brown 12512ef1f0ffSBarry Smith Not Collective 1252900e7ff2SJed Brown 1253f899ff85SJose E. Roman Input Parameter: 125411a5261eSBarry Smith . A - `MATNEST` matrix 1255900e7ff2SJed Brown 1256d8d19677SJose E. Roman Output Parameters: 1257900e7ff2SJed Brown + rows - array of row index sets 1258900e7ff2SJed Brown - cols - array of column index sets 1259900e7ff2SJed Brown 1260900e7ff2SJed Brown Level: advanced 1261900e7ff2SJed Brown 126211a5261eSBarry Smith Note: 12632ef1f0ffSBarry Smith The user must have allocated arrays of the correct size. The reference count is not increased on the returned `IS`s. 1264900e7ff2SJed Brown 1265fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatNestGetSubMat()`, `MatNestGetSubMats()`, `MatNestGetSize()`, `MatNestGetLocalISs()`, 1266fe59aa6dSJacob Faibussowitsch `MatCreateNest()`, `MatNestSetSubMats()` 1267900e7ff2SJed Brown @*/ 1268d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestGetISs(Mat A, IS rows[], IS cols[]) 1269d71ae5a4SJacob Faibussowitsch { 1270900e7ff2SJed Brown PetscFunctionBegin; 1271900e7ff2SJed Brown PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1272cac4c232SBarry Smith PetscUseMethod(A, "MatNestGetISs_C", (Mat, IS[], IS[]), (A, rows, cols)); 12733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1274900e7ff2SJed Brown } 1275900e7ff2SJed Brown 1276d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestGetLocalISs_Nest(Mat A, IS rows[], IS cols[]) 1277d71ae5a4SJacob Faibussowitsch { 1278900e7ff2SJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 1279900e7ff2SJed Brown PetscInt i; 1280900e7ff2SJed Brown 1281900e7ff2SJed Brown PetscFunctionBegin; 12829371c9d4SSatish Balay if (rows) 12839371c9d4SSatish Balay for (i = 0; i < vs->nr; i++) rows[i] = vs->islocal.row[i]; 12849371c9d4SSatish Balay if (cols) 12859371c9d4SSatish Balay for (i = 0; i < vs->nc; i++) cols[i] = vs->islocal.col[i]; 12863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1287900e7ff2SJed Brown } 1288900e7ff2SJed Brown 1289900e7ff2SJed Brown /*@C 129011a5261eSBarry Smith MatNestGetLocalISs - Returns the index sets partitioning the row and column spaces of a `MATNEST` 1291900e7ff2SJed Brown 12922ef1f0ffSBarry Smith Not Collective 1293900e7ff2SJed Brown 1294f899ff85SJose E. Roman Input Parameter: 129511a5261eSBarry Smith . A - `MATNEST` matrix 1296900e7ff2SJed Brown 1297d8d19677SJose E. Roman Output Parameters: 12982ef1f0ffSBarry Smith + rows - array of row index sets (or `NULL` to ignore) 12992ef1f0ffSBarry Smith - cols - array of column index sets (or `NULL` to ignore) 1300900e7ff2SJed Brown 1301900e7ff2SJed Brown Level: advanced 1302900e7ff2SJed Brown 130311a5261eSBarry Smith Note: 13042ef1f0ffSBarry Smith The user must have allocated arrays of the correct size. The reference count is not increased on the returned `IS`s. 1305900e7ff2SJed Brown 13061cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatNestGetSubMat()`, `MatNestGetSubMats()`, `MatNestGetSize()`, `MatNestGetISs()`, `MatCreateNest()`, 1307fe59aa6dSJacob Faibussowitsch `MatNestSetSubMats()`, `MatNestSetSubMat()` 1308900e7ff2SJed Brown @*/ 1309d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestGetLocalISs(Mat A, IS rows[], IS cols[]) 1310d71ae5a4SJacob Faibussowitsch { 1311900e7ff2SJed Brown PetscFunctionBegin; 1312900e7ff2SJed Brown PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 1313cac4c232SBarry Smith PetscUseMethod(A, "MatNestGetLocalISs_C", (Mat, IS[], IS[]), (A, rows, cols)); 13143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1315900e7ff2SJed Brown } 1316900e7ff2SJed Brown 131766976f2fSJacob Faibussowitsch static PetscErrorCode MatNestSetVecType_Nest(Mat A, VecType vtype) 1318d71ae5a4SJacob Faibussowitsch { 1319207556f9SJed Brown PetscBool flg; 1320207556f9SJed Brown 1321207556f9SJed Brown PetscFunctionBegin; 13229566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(vtype, VECNEST, &flg)); 1323207556f9SJed Brown /* In reality, this only distinguishes VECNEST and "other" */ 13242a7a6963SBarry Smith if (flg) A->ops->getvecs = MatCreateVecs_Nest; 132512b53f24SSatish Balay else A->ops->getvecs = (PetscErrorCode(*)(Mat, Vec *, Vec *))0; 13263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1327207556f9SJed Brown } 1328207556f9SJed Brown 1329207556f9SJed Brown /*@C 133011a5261eSBarry Smith MatNestSetVecType - Sets the type of `Vec` returned by `MatCreateVecs()` 1331207556f9SJed Brown 13322ef1f0ffSBarry Smith Not Collective 1333207556f9SJed Brown 1334207556f9SJed Brown Input Parameters: 133511a5261eSBarry Smith + A - `MATNEST` matrix 133611a5261eSBarry Smith - vtype - `VecType` to use for creating vectors 1337207556f9SJed Brown 1338207556f9SJed Brown Level: developer 1339207556f9SJed Brown 1340fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatCreateVecs()`, `MatCreateNest()`, `VecType` 1341207556f9SJed Brown @*/ 1342d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestSetVecType(Mat A, VecType vtype) 1343d71ae5a4SJacob Faibussowitsch { 1344207556f9SJed Brown PetscFunctionBegin; 1345cac4c232SBarry Smith PetscTryMethod(A, "MatNestSetVecType_C", (Mat, VecType), (A, vtype)); 13463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1347207556f9SJed Brown } 1348207556f9SJed Brown 134966976f2fSJacob Faibussowitsch static PetscErrorCode MatNestSetSubMats_Nest(Mat A, PetscInt nr, const IS is_row[], PetscInt nc, const IS is_col[], const Mat a[]) 1350d71ae5a4SJacob Faibussowitsch { 1351c8883902SJed Brown Mat_Nest *s = (Mat_Nest *)A->data; 1352c8883902SJed Brown PetscInt i, j, m, n, M, N; 135388ffe2e8SJose E. Roman PetscBool cong, isstd, sametype = PETSC_FALSE; 135488ffe2e8SJose E. Roman VecType vtype, type; 1355d8588912SDave May 1356d8588912SDave May PetscFunctionBegin; 13579566063dSJacob Faibussowitsch PetscCall(MatReset_Nest(A)); 135806a1af2fSStefano Zampini 1359c8883902SJed Brown s->nr = nr; 1360c8883902SJed Brown s->nc = nc; 1361d8588912SDave May 1362c8883902SJed Brown /* Create space for submatrices */ 13639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nr, &s->m)); 13648068ee9dSPierre Jolivet PetscCall(PetscMalloc1(nr * nc, &s->m[0])); 1365c8883902SJed Brown for (i = 0; i < nr; i++) { 13668068ee9dSPierre Jolivet s->m[i] = s->m[0] + i * nc; 1367c8883902SJed Brown for (j = 0; j < nc; j++) { 1368c8883902SJed Brown s->m[i][j] = a[i * nc + j]; 136948a46eb9SPierre Jolivet if (a[i * nc + j]) PetscCall(PetscObjectReference((PetscObject)a[i * nc + j])); 1370d8588912SDave May } 1371d8588912SDave May } 13729566063dSJacob Faibussowitsch PetscCall(MatGetVecType(A, &vtype)); 13739566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(vtype, VECSTANDARD, &isstd)); 137488ffe2e8SJose E. Roman if (isstd) { 137588ffe2e8SJose E. Roman /* check if all blocks have the same vectype */ 137688ffe2e8SJose E. Roman vtype = NULL; 137788ffe2e8SJose E. Roman for (i = 0; i < nr; i++) { 137888ffe2e8SJose E. Roman for (j = 0; j < nc; j++) { 137988ffe2e8SJose E. Roman if (a[i * nc + j]) { 138088ffe2e8SJose E. Roman if (!vtype) { /* first visited block */ 13819566063dSJacob Faibussowitsch PetscCall(MatGetVecType(a[i * nc + j], &vtype)); 138288ffe2e8SJose E. Roman sametype = PETSC_TRUE; 138388ffe2e8SJose E. Roman } else if (sametype) { 13849566063dSJacob Faibussowitsch PetscCall(MatGetVecType(a[i * nc + j], &type)); 13859566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(vtype, type, &sametype)); 138688ffe2e8SJose E. Roman } 138788ffe2e8SJose E. Roman } 138888ffe2e8SJose E. Roman } 138988ffe2e8SJose E. Roman } 139088ffe2e8SJose E. Roman if (sametype) { /* propagate vectype */ 13919566063dSJacob Faibussowitsch PetscCall(MatSetVecType(A, vtype)); 139288ffe2e8SJose E. Roman } 139388ffe2e8SJose E. Roman } 1394d8588912SDave May 13959566063dSJacob Faibussowitsch PetscCall(MatSetUp_NestIS_Private(A, nr, is_row, nc, is_col)); 1396d8588912SDave May 13979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nr, &s->row_len)); 13989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nc, &s->col_len)); 1399c8883902SJed Brown for (i = 0; i < nr; i++) s->row_len[i] = -1; 1400c8883902SJed Brown for (j = 0; j < nc; j++) s->col_len[j] = -1; 1401d8588912SDave May 14029566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nr * nc, &s->nnzstate)); 140306a1af2fSStefano Zampini for (i = 0; i < nr; i++) { 140406a1af2fSStefano Zampini for (j = 0; j < nc; j++) { 140548a46eb9SPierre Jolivet if (s->m[i][j]) PetscCall(MatGetNonzeroState(s->m[i][j], &s->nnzstate[i * nc + j])); 140606a1af2fSStefano Zampini } 140706a1af2fSStefano Zampini } 140806a1af2fSStefano Zampini 14099566063dSJacob Faibussowitsch PetscCall(MatNestGetSizes_Private(A, &m, &n, &M, &N)); 1410d8588912SDave May 14119566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetSize(A->rmap, M)); 14129566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetLocalSize(A->rmap, m)); 14139566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetSize(A->cmap, N)); 14149566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetLocalSize(A->cmap, n)); 1415c8883902SJed Brown 14169566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 14179566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 1418c8883902SJed Brown 141906a1af2fSStefano Zampini /* disable operations that are not supported for non-square matrices, 142006a1af2fSStefano Zampini or matrices for which is_row != is_col */ 14219566063dSJacob Faibussowitsch PetscCall(MatHasCongruentLayouts(A, &cong)); 142206a1af2fSStefano Zampini if (cong && nr != nc) cong = PETSC_FALSE; 142306a1af2fSStefano Zampini if (cong) { 142448a46eb9SPierre Jolivet for (i = 0; cong && i < nr; i++) PetscCall(ISEqualUnsorted(s->isglobal.row[i], s->isglobal.col[i], &cong)); 142506a1af2fSStefano Zampini } 142606a1af2fSStefano Zampini if (!cong) { 1427381b8e50SStefano Zampini A->ops->missingdiagonal = NULL; 142806a1af2fSStefano Zampini A->ops->getdiagonal = NULL; 142906a1af2fSStefano Zampini A->ops->shift = NULL; 143006a1af2fSStefano Zampini A->ops->diagonalset = NULL; 143106a1af2fSStefano Zampini } 143206a1af2fSStefano Zampini 14339566063dSJacob Faibussowitsch PetscCall(PetscCalloc2(nr, &s->left, nc, &s->right)); 14349566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 143506a1af2fSStefano Zampini A->nonzerostate++; 14363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1437d8588912SDave May } 1438d8588912SDave May 1439c8883902SJed Brown /*@ 144011a5261eSBarry Smith MatNestSetSubMats - Sets the nested submatrices in a `MATNEST` 1441c8883902SJed Brown 1442c3339decSBarry Smith Collective 1443c8883902SJed Brown 1444d8d19677SJose E. Roman Input Parameters: 144511a5261eSBarry Smith + A - `MATNEST` matrix 1446c8883902SJed Brown . nr - number of nested row blocks 14472ef1f0ffSBarry Smith . is_row - index sets for each nested row block, or `NULL` to make contiguous 1448c8883902SJed Brown . nc - number of nested column blocks 14492ef1f0ffSBarry Smith . is_col - index sets for each nested column block, or `NULL` to make contiguous 1450e9d3347aSJose E. Roman - a - array of nr*nc submatrices, empty submatrices can be passed using `NULL` 14512ef1f0ffSBarry Smith 14522ef1f0ffSBarry Smith Level: advanced 1453c8883902SJed Brown 1454e9d3347aSJose E. Roman Notes: 145511a5261eSBarry Smith This always resets any submatrix information previously set 145606a1af2fSStefano Zampini 1457e9d3347aSJose E. Roman In both C and Fortran, `a` must be a row-major order array containing the matrices. See 1458e9d3347aSJose E. Roman `MatCreateNest()` for an example. 1459e9d3347aSJose E. Roman 14601cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatCreateNest()`, `MatNestSetSubMat()`, `MatNestGetSubMat()`, `MatNestGetSubMats()` 1461c8883902SJed Brown @*/ 1462d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNestSetSubMats(Mat A, PetscInt nr, const IS is_row[], PetscInt nc, const IS is_col[], const Mat a[]) 1463d71ae5a4SJacob Faibussowitsch { 146406a1af2fSStefano Zampini PetscInt i; 1465c8883902SJed Brown 1466c8883902SJed Brown PetscFunctionBegin; 1467c8883902SJed Brown PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 146808401ef6SPierre Jolivet PetscCheck(nr >= 0, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Number of rows cannot be negative"); 1469c8883902SJed Brown if (nr && is_row) { 14704f572ea9SToby Isaac PetscAssertPointer(is_row, 3); 1471c8883902SJed Brown for (i = 0; i < nr; i++) PetscValidHeaderSpecific(is_row[i], IS_CLASSID, 3); 1472c8883902SJed Brown } 147308401ef6SPierre Jolivet PetscCheck(nc >= 0, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Number of columns cannot be negative"); 14741664e352SJed Brown if (nc && is_col) { 14754f572ea9SToby Isaac PetscAssertPointer(is_col, 5); 14769b30a8f6SBarry Smith for (i = 0; i < nc; i++) PetscValidHeaderSpecific(is_col[i], IS_CLASSID, 5); 1477c8883902SJed Brown } 14784f572ea9SToby Isaac if (nr * nc > 0) PetscAssertPointer(a, 6); 1479cac4c232SBarry Smith PetscUseMethod(A, "MatNestSetSubMats_C", (Mat, PetscInt, const IS[], PetscInt, const IS[], const Mat[]), (A, nr, is_row, nc, is_col, a)); 14803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1481c8883902SJed Brown } 1482d8588912SDave May 1483d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatNestCreateAggregateL2G_Private(Mat A, PetscInt n, const IS islocal[], const IS isglobal[], PetscBool colflg, ISLocalToGlobalMapping *ltog) 1484d71ae5a4SJacob Faibussowitsch { 148577019fcaSJed Brown PetscBool flg; 148677019fcaSJed Brown PetscInt i, j, m, mi, *ix; 148777019fcaSJed Brown 148877019fcaSJed Brown PetscFunctionBegin; 1489aea6d515SStefano Zampini *ltog = NULL; 149077019fcaSJed Brown for (i = 0, m = 0, flg = PETSC_FALSE; i < n; i++) { 149177019fcaSJed Brown if (islocal[i]) { 14929566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(islocal[i], &mi)); 149377019fcaSJed Brown flg = PETSC_TRUE; /* We found a non-trivial entry */ 149477019fcaSJed Brown } else { 14959566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isglobal[i], &mi)); 149677019fcaSJed Brown } 149777019fcaSJed Brown m += mi; 149877019fcaSJed Brown } 14993ba16761SJacob Faibussowitsch if (!flg) PetscFunctionReturn(PETSC_SUCCESS); 1500aea6d515SStefano Zampini 15019566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &ix)); 1502165cd838SBarry Smith for (i = 0, m = 0; i < n; i++) { 15030298fd71SBarry Smith ISLocalToGlobalMapping smap = NULL; 1504e108cb99SStefano Zampini Mat sub = NULL; 1505f6d38dbbSStefano Zampini PetscSF sf; 1506f6d38dbbSStefano Zampini PetscLayout map; 1507aea6d515SStefano Zampini const PetscInt *ix2; 150877019fcaSJed Brown 1509165cd838SBarry Smith if (!colflg) { 15109566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatRow(A, i, &sub)); 151177019fcaSJed Brown } else { 15129566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatCol(A, i, &sub)); 151377019fcaSJed Brown } 1514191fd14bSBarry Smith if (sub) { 1515191fd14bSBarry Smith if (!colflg) { 15169566063dSJacob Faibussowitsch PetscCall(MatGetLocalToGlobalMapping(sub, &smap, NULL)); 1517191fd14bSBarry Smith } else { 15189566063dSJacob Faibussowitsch PetscCall(MatGetLocalToGlobalMapping(sub, NULL, &smap)); 1519191fd14bSBarry Smith } 1520191fd14bSBarry Smith } 152177019fcaSJed Brown /* 152277019fcaSJed Brown Now we need to extract the monolithic global indices that correspond to the given split global indices. 152377019fcaSJed Brown In many/most cases, we only want MatGetLocalSubMatrix() to work, in which case we only need to know the size of the local spaces. 152477019fcaSJed Brown */ 15259566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isglobal[i], &ix2)); 1526aea6d515SStefano Zampini if (islocal[i]) { 1527aea6d515SStefano Zampini PetscInt *ilocal, *iremote; 1528aea6d515SStefano Zampini PetscInt mil, nleaves; 1529aea6d515SStefano Zampini 15309566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(islocal[i], &mi)); 153128b400f6SJacob Faibussowitsch PetscCheck(smap, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "Missing local to global map"); 1532aea6d515SStefano Zampini for (j = 0; j < mi; j++) ix[m + j] = j; 15339566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingApply(smap, mi, ix + m, ix + m)); 1534aea6d515SStefano Zampini 1535aea6d515SStefano Zampini /* PetscSFSetGraphLayout does not like negative indices */ 15369566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(mi, &ilocal, mi, &iremote)); 1537aea6d515SStefano Zampini for (j = 0, nleaves = 0; j < mi; j++) { 1538aea6d515SStefano Zampini if (ix[m + j] < 0) continue; 1539aea6d515SStefano Zampini ilocal[nleaves] = j; 1540aea6d515SStefano Zampini iremote[nleaves] = ix[m + j]; 1541aea6d515SStefano Zampini nleaves++; 1542aea6d515SStefano Zampini } 15439566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isglobal[i], &mil)); 15449566063dSJacob Faibussowitsch PetscCall(PetscSFCreate(PetscObjectComm((PetscObject)A), &sf)); 15459566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreate(PetscObjectComm((PetscObject)A), &map)); 15469566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetLocalSize(map, mil)); 15479566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(map)); 15489566063dSJacob Faibussowitsch PetscCall(PetscSFSetGraphLayout(sf, map, nleaves, ilocal, PETSC_USE_POINTER, iremote)); 15499566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&map)); 15509566063dSJacob Faibussowitsch PetscCall(PetscSFBcastBegin(sf, MPIU_INT, ix2, ix + m, MPI_REPLACE)); 15519566063dSJacob Faibussowitsch PetscCall(PetscSFBcastEnd(sf, MPIU_INT, ix2, ix + m, MPI_REPLACE)); 15529566063dSJacob Faibussowitsch PetscCall(PetscSFDestroy(&sf)); 15539566063dSJacob Faibussowitsch PetscCall(PetscFree2(ilocal, iremote)); 1554aea6d515SStefano Zampini } else { 15559566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isglobal[i], &mi)); 1556aea6d515SStefano Zampini for (j = 0; j < mi; j++) ix[m + j] = ix2[i]; 1557aea6d515SStefano Zampini } 15589566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isglobal[i], &ix2)); 155977019fcaSJed Brown m += mi; 156077019fcaSJed Brown } 15619566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PetscObjectComm((PetscObject)A), 1, m, ix, PETSC_OWN_POINTER, ltog)); 15623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 156377019fcaSJed Brown } 156477019fcaSJed Brown 1565d8588912SDave May /* If an IS was provided, there is nothing Nest needs to do, otherwise Nest will build a strided IS */ 1566d8588912SDave May /* 1567d8588912SDave May nprocessors = NP 1568d8588912SDave May Nest x^T = ((g_0,g_1,...g_nprocs-1), (h_0,h_1,...h_NP-1)) 1569d8588912SDave May proc 0: => (g_0,h_0,) 1570d8588912SDave May proc 1: => (g_1,h_1,) 1571d8588912SDave May ... 1572d8588912SDave May proc nprocs-1: => (g_NP-1,h_NP-1,) 1573d8588912SDave May 1574d8588912SDave May proc 0: proc 1: proc nprocs-1: 1575d8588912SDave May is[0] = (0,1,2,...,nlocal(g_0)-1) (0,1,...,nlocal(g_1)-1) (0,1,...,nlocal(g_NP-1)) 1576d8588912SDave May 1577d8588912SDave May proc 0: 1578d8588912SDave May is[1] = (nlocal(g_0),nlocal(g_0)+1,...,nlocal(g_0)+nlocal(h_0)-1) 1579d8588912SDave May proc 1: 1580d8588912SDave May is[1] = (nlocal(g_1),nlocal(g_1)+1,...,nlocal(g_1)+nlocal(h_1)-1) 1581d8588912SDave May 1582d8588912SDave May proc NP-1: 1583d8588912SDave May is[1] = (nlocal(g_NP-1),nlocal(g_NP-1)+1,...,nlocal(g_NP-1)+nlocal(h_NP-1)-1) 1584d8588912SDave May */ 1585d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetUp_NestIS_Private(Mat A, PetscInt nr, const IS is_row[], PetscInt nc, const IS is_col[]) 1586d71ae5a4SJacob Faibussowitsch { 1587e2d7f03fSJed Brown Mat_Nest *vs = (Mat_Nest *)A->data; 15888188e55aSJed Brown PetscInt i, j, offset, n, nsum, bs; 15890298fd71SBarry Smith Mat sub = NULL; 1590d8588912SDave May 1591d8588912SDave May PetscFunctionBegin; 15929566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nr, &vs->isglobal.row)); 15939566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nc, &vs->isglobal.col)); 1594d8588912SDave May if (is_row) { /* valid IS is passed in */ 1595a5b23f4aSJose E. Roman /* refs on is[] are incremented */ 1596e2d7f03fSJed Brown for (i = 0; i < vs->nr; i++) { 15979566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)is_row[i])); 159826fbe8dcSKarl Rupp 1599e2d7f03fSJed Brown vs->isglobal.row[i] = is_row[i]; 1600d8588912SDave May } 16012ae74bdbSJed Brown } else { /* Create the ISs by inspecting sizes of a submatrix in each row */ 16028188e55aSJed Brown nsum = 0; 16038188e55aSJed Brown for (i = 0; i < vs->nr; i++) { /* Add up the local sizes to compute the aggregate offset */ 16049566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatRow(A, i, &sub)); 160528b400f6SJacob Faibussowitsch PetscCheck(sub, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "No nonzero submatrix in row %" PetscInt_FMT, i); 16069566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(sub, &n, NULL)); 160708401ef6SPierre Jolivet PetscCheck(n >= 0, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Sizes have not yet been set for submatrix"); 16088188e55aSJed Brown nsum += n; 16098188e55aSJed Brown } 16109566063dSJacob Faibussowitsch PetscCallMPI(MPI_Scan(&nsum, &offset, 1, MPIU_INT, MPI_SUM, PetscObjectComm((PetscObject)A))); 161130bc264bSJed Brown offset -= nsum; 1612e2d7f03fSJed Brown for (i = 0; i < vs->nr; i++) { 16139566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatRow(A, i, &sub)); 16149566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(sub, &n, NULL)); 16159566063dSJacob Faibussowitsch PetscCall(MatGetBlockSizes(sub, &bs, NULL)); 16169566063dSJacob Faibussowitsch PetscCall(ISCreateStride(PetscObjectComm((PetscObject)sub), n, offset, 1, &vs->isglobal.row[i])); 16179566063dSJacob Faibussowitsch PetscCall(ISSetBlockSize(vs->isglobal.row[i], bs)); 16182ae74bdbSJed Brown offset += n; 1619d8588912SDave May } 1620d8588912SDave May } 1621d8588912SDave May 1622d8588912SDave May if (is_col) { /* valid IS is passed in */ 1623a5b23f4aSJose E. Roman /* refs on is[] are incremented */ 1624e2d7f03fSJed Brown for (j = 0; j < vs->nc; j++) { 16259566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)is_col[j])); 162626fbe8dcSKarl Rupp 1627e2d7f03fSJed Brown vs->isglobal.col[j] = is_col[j]; 1628d8588912SDave May } 16292ae74bdbSJed Brown } else { /* Create the ISs by inspecting sizes of a submatrix in each column */ 16302ae74bdbSJed Brown offset = A->cmap->rstart; 16318188e55aSJed Brown nsum = 0; 16328188e55aSJed Brown for (j = 0; j < vs->nc; j++) { 16339566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatCol(A, j, &sub)); 163428b400f6SJacob Faibussowitsch PetscCheck(sub, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "No nonzero submatrix in column %" PetscInt_FMT, i); 16359566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(sub, NULL, &n)); 163608401ef6SPierre Jolivet PetscCheck(n >= 0, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Sizes have not yet been set for submatrix"); 16378188e55aSJed Brown nsum += n; 16388188e55aSJed Brown } 16399566063dSJacob Faibussowitsch PetscCallMPI(MPI_Scan(&nsum, &offset, 1, MPIU_INT, MPI_SUM, PetscObjectComm((PetscObject)A))); 164030bc264bSJed Brown offset -= nsum; 1641e2d7f03fSJed Brown for (j = 0; j < vs->nc; j++) { 16429566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatCol(A, j, &sub)); 16439566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(sub, NULL, &n)); 16449566063dSJacob Faibussowitsch PetscCall(MatGetBlockSizes(sub, NULL, &bs)); 16459566063dSJacob Faibussowitsch PetscCall(ISCreateStride(PetscObjectComm((PetscObject)sub), n, offset, 1, &vs->isglobal.col[j])); 16469566063dSJacob Faibussowitsch PetscCall(ISSetBlockSize(vs->isglobal.col[j], bs)); 16472ae74bdbSJed Brown offset += n; 1648d8588912SDave May } 1649d8588912SDave May } 1650e2d7f03fSJed Brown 1651e2d7f03fSJed Brown /* Set up the local ISs */ 16529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(vs->nr, &vs->islocal.row)); 16539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(vs->nc, &vs->islocal.col)); 1654e2d7f03fSJed Brown for (i = 0, offset = 0; i < vs->nr; i++) { 1655e2d7f03fSJed Brown IS isloc; 16560298fd71SBarry Smith ISLocalToGlobalMapping rmap = NULL; 1657e2d7f03fSJed Brown PetscInt nlocal, bs; 16589566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatRow(A, i, &sub)); 16599566063dSJacob Faibussowitsch if (sub) PetscCall(MatGetLocalToGlobalMapping(sub, &rmap, NULL)); 1660207556f9SJed Brown if (rmap) { 16619566063dSJacob Faibussowitsch PetscCall(MatGetBlockSizes(sub, &bs, NULL)); 16629566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingGetSize(rmap, &nlocal)); 16639566063dSJacob Faibussowitsch PetscCall(ISCreateStride(PETSC_COMM_SELF, nlocal, offset, 1, &isloc)); 16649566063dSJacob Faibussowitsch PetscCall(ISSetBlockSize(isloc, bs)); 1665207556f9SJed Brown } else { 1666207556f9SJed Brown nlocal = 0; 16670298fd71SBarry Smith isloc = NULL; 1668207556f9SJed Brown } 1669e2d7f03fSJed Brown vs->islocal.row[i] = isloc; 1670e2d7f03fSJed Brown offset += nlocal; 1671e2d7f03fSJed Brown } 16728188e55aSJed Brown for (i = 0, offset = 0; i < vs->nc; i++) { 1673e2d7f03fSJed Brown IS isloc; 16740298fd71SBarry Smith ISLocalToGlobalMapping cmap = NULL; 1675e2d7f03fSJed Brown PetscInt nlocal, bs; 16769566063dSJacob Faibussowitsch PetscCall(MatNestFindNonzeroSubMatCol(A, i, &sub)); 16779566063dSJacob Faibussowitsch if (sub) PetscCall(MatGetLocalToGlobalMapping(sub, NULL, &cmap)); 1678207556f9SJed Brown if (cmap) { 16799566063dSJacob Faibussowitsch PetscCall(MatGetBlockSizes(sub, NULL, &bs)); 16809566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingGetSize(cmap, &nlocal)); 16819566063dSJacob Faibussowitsch PetscCall(ISCreateStride(PETSC_COMM_SELF, nlocal, offset, 1, &isloc)); 16829566063dSJacob Faibussowitsch PetscCall(ISSetBlockSize(isloc, bs)); 1683207556f9SJed Brown } else { 1684207556f9SJed Brown nlocal = 0; 16850298fd71SBarry Smith isloc = NULL; 1686207556f9SJed Brown } 1687e2d7f03fSJed Brown vs->islocal.col[i] = isloc; 1688e2d7f03fSJed Brown offset += nlocal; 1689e2d7f03fSJed Brown } 16900189643fSJed Brown 169177019fcaSJed Brown /* Set up the aggregate ISLocalToGlobalMapping */ 169277019fcaSJed Brown { 169345b6f7e9SBarry Smith ISLocalToGlobalMapping rmap, cmap; 16949566063dSJacob Faibussowitsch PetscCall(MatNestCreateAggregateL2G_Private(A, vs->nr, vs->islocal.row, vs->isglobal.row, PETSC_FALSE, &rmap)); 16959566063dSJacob Faibussowitsch PetscCall(MatNestCreateAggregateL2G_Private(A, vs->nc, vs->islocal.col, vs->isglobal.col, PETSC_TRUE, &cmap)); 16969566063dSJacob Faibussowitsch if (rmap && cmap) PetscCall(MatSetLocalToGlobalMapping(A, rmap, cmap)); 16979566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&rmap)); 16989566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingDestroy(&cmap)); 169977019fcaSJed Brown } 170077019fcaSJed Brown 170176bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 17020189643fSJed Brown for (i = 0; i < vs->nr; i++) { 17030189643fSJed Brown for (j = 0; j < vs->nc; j++) { 17040189643fSJed Brown PetscInt m, n, M, N, mi, ni, Mi, Ni; 17050189643fSJed Brown Mat B = vs->m[i][j]; 17060189643fSJed Brown if (!B) continue; 17079566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &M, &N)); 17089566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(B, &m, &n)); 17099566063dSJacob Faibussowitsch PetscCall(ISGetSize(vs->isglobal.row[i], &Mi)); 17109566063dSJacob Faibussowitsch PetscCall(ISGetSize(vs->isglobal.col[j], &Ni)); 17119566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(vs->isglobal.row[i], &mi)); 17129566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(vs->isglobal.col[j], &ni)); 1713aed4548fSBarry Smith PetscCheck(M == Mi && N == Ni, PetscObjectComm((PetscObject)sub), PETSC_ERR_ARG_INCOMP, "Global sizes (%" PetscInt_FMT ",%" PetscInt_FMT ") of nested submatrix (%" PetscInt_FMT ",%" PetscInt_FMT ") do not agree with space defined by index sets (%" PetscInt_FMT ",%" PetscInt_FMT ")", M, N, i, j, Mi, Ni); 1714aed4548fSBarry Smith PetscCheck(m == mi && n == ni, PetscObjectComm((PetscObject)sub), PETSC_ERR_ARG_INCOMP, "Local sizes (%" PetscInt_FMT ",%" PetscInt_FMT ") of nested submatrix (%" PetscInt_FMT ",%" PetscInt_FMT ") do not agree with space defined by index sets (%" PetscInt_FMT ",%" PetscInt_FMT ")", m, n, i, j, mi, ni); 17150189643fSJed Brown } 17160189643fSJed Brown } 171776bd3646SJed Brown } 1718a061e289SJed Brown 1719a061e289SJed Brown /* Set A->assembled if all non-null blocks are currently assembled */ 1720a061e289SJed Brown for (i = 0; i < vs->nr; i++) { 1721a061e289SJed Brown for (j = 0; j < vs->nc; j++) { 17223ba16761SJacob Faibussowitsch if (vs->m[i][j] && !vs->m[i][j]->assembled) PetscFunctionReturn(PETSC_SUCCESS); 1723a061e289SJed Brown } 1724a061e289SJed Brown } 1725a061e289SJed Brown A->assembled = PETSC_TRUE; 17263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1727d8588912SDave May } 1728d8588912SDave May 172945c38901SJed Brown /*@C 173011a5261eSBarry Smith MatCreateNest - Creates a new `MATNEST` matrix containing several nested submatrices, each stored separately 1731659c6bb0SJed Brown 173211a5261eSBarry Smith Collective 1733659c6bb0SJed Brown 1734d8d19677SJose E. Roman Input Parameters: 173511a5261eSBarry Smith + comm - Communicator for the new `MATNEST` 1736659c6bb0SJed Brown . nr - number of nested row blocks 17372ef1f0ffSBarry Smith . is_row - index sets for each nested row block, or `NULL` to make contiguous 1738659c6bb0SJed Brown . nc - number of nested column blocks 17392ef1f0ffSBarry Smith . is_col - index sets for each nested column block, or `NULL` to make contiguous 1740e9d3347aSJose E. Roman - a - array of nr*nc submatrices, empty submatrices can be passed using `NULL` 1741659c6bb0SJed Brown 1742659c6bb0SJed Brown Output Parameter: 1743659c6bb0SJed Brown . B - new matrix 1744659c6bb0SJed Brown 1745e9d3347aSJose E. Roman Note: 1746e9d3347aSJose E. Roman In both C and Fortran, `a` must be a row-major order array holding references to the matrices. 1747e9d3347aSJose E. Roman For instance, to represent the matrix 1748e9d3347aSJose E. Roman $\begin{bmatrix} A_{11} & A_{12} \\ A_{21} & A_{22}\end{bmatrix}$ 1749e9d3347aSJose E. Roman one should use `Mat a[4]={A11,A12,A21,A22}`. 1750e9d3347aSJose E. Roman 1751659c6bb0SJed Brown Level: advanced 1752659c6bb0SJed Brown 17531cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatCreate()`, `VecCreateNest()`, `DMCreateMatrix()`, `MatNestSetSubMat()`, 1754db781477SPatrick Sanan `MatNestGetSubMat()`, `MatNestGetLocalISs()`, `MatNestGetSize()`, 1755db781477SPatrick Sanan `MatNestGetISs()`, `MatNestSetSubMats()`, `MatNestGetSubMats()` 1756659c6bb0SJed Brown @*/ 1757d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateNest(MPI_Comm comm, PetscInt nr, const IS is_row[], PetscInt nc, const IS is_col[], const Mat a[], Mat *B) 1758d71ae5a4SJacob Faibussowitsch { 1759d8588912SDave May Mat A; 1760d8588912SDave May 1761d8588912SDave May PetscFunctionBegin; 1762f4259b30SLisandro Dalcin *B = NULL; 17639566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, &A)); 17649566063dSJacob Faibussowitsch PetscCall(MatSetType(A, MATNEST)); 176591a28eb3SBarry Smith A->preallocated = PETSC_TRUE; 17669566063dSJacob Faibussowitsch PetscCall(MatNestSetSubMats(A, nr, is_row, nc, is_col, a)); 1767d8588912SDave May *B = A; 17683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1769d8588912SDave May } 1770659c6bb0SJed Brown 177166976f2fSJacob Faibussowitsch static PetscErrorCode MatConvert_Nest_SeqAIJ_fast(Mat A, MatType newtype, MatReuse reuse, Mat *newmat) 1772d71ae5a4SJacob Faibussowitsch { 1773b68353e5Sstefano_zampini Mat_Nest *nest = (Mat_Nest *)A->data; 177423875855Sstefano_zampini Mat *trans; 1775b68353e5Sstefano_zampini PetscScalar **avv; 1776b68353e5Sstefano_zampini PetscScalar *vv; 1777b68353e5Sstefano_zampini PetscInt **aii, **ajj; 1778b68353e5Sstefano_zampini PetscInt *ii, *jj, *ci; 1779b68353e5Sstefano_zampini PetscInt nr, nc, nnz, i, j; 1780b68353e5Sstefano_zampini PetscBool done; 1781b68353e5Sstefano_zampini 1782b68353e5Sstefano_zampini PetscFunctionBegin; 17839566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &nr, &nc)); 1784b68353e5Sstefano_zampini if (reuse == MAT_REUSE_MATRIX) { 1785b68353e5Sstefano_zampini PetscInt rnr; 1786b68353e5Sstefano_zampini 17879566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(*newmat, 0, PETSC_FALSE, PETSC_FALSE, &rnr, (const PetscInt **)&ii, (const PetscInt **)&jj, &done)); 178828b400f6SJacob Faibussowitsch PetscCheck(done, PetscObjectComm((PetscObject)A), PETSC_ERR_PLIB, "MatGetRowIJ"); 178908401ef6SPierre Jolivet PetscCheck(rnr == nr, PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "Cannot reuse matrix, wrong number of rows"); 17909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*newmat, &vv)); 1791b68353e5Sstefano_zampini } 1792b68353e5Sstefano_zampini /* extract CSR for nested SeqAIJ matrices */ 1793b68353e5Sstefano_zampini nnz = 0; 17949566063dSJacob Faibussowitsch PetscCall(PetscCalloc4(nest->nr * nest->nc, &aii, nest->nr * nest->nc, &ajj, nest->nr * nest->nc, &avv, nest->nr * nest->nc, &trans)); 1795b68353e5Sstefano_zampini for (i = 0; i < nest->nr; ++i) { 1796b68353e5Sstefano_zampini for (j = 0; j < nest->nc; ++j) { 1797b68353e5Sstefano_zampini Mat B = nest->m[i][j]; 1798b68353e5Sstefano_zampini if (B) { 1799b68353e5Sstefano_zampini PetscScalar *naa; 1800b68353e5Sstefano_zampini PetscInt *nii, *njj, nnr; 180123875855Sstefano_zampini PetscBool istrans; 1802b68353e5Sstefano_zampini 1803013e2dc7SBarry Smith PetscCall(PetscObjectTypeCompare((PetscObject)B, MATTRANSPOSEVIRTUAL, &istrans)); 180423875855Sstefano_zampini if (istrans) { 180523875855Sstefano_zampini Mat Bt; 180623875855Sstefano_zampini 18079566063dSJacob Faibussowitsch PetscCall(MatTransposeGetMat(B, &Bt)); 18089566063dSJacob Faibussowitsch PetscCall(MatTranspose(Bt, MAT_INITIAL_MATRIX, &trans[i * nest->nc + j])); 180923875855Sstefano_zampini B = trans[i * nest->nc + j]; 1810013e2dc7SBarry Smith } else { 1811013e2dc7SBarry Smith PetscCall(PetscObjectTypeCompare((PetscObject)B, MATHERMITIANTRANSPOSEVIRTUAL, &istrans)); 1812013e2dc7SBarry Smith if (istrans) { 1813013e2dc7SBarry Smith Mat Bt; 1814013e2dc7SBarry Smith 1815013e2dc7SBarry Smith PetscCall(MatHermitianTransposeGetMat(B, &Bt)); 1816013e2dc7SBarry Smith PetscCall(MatHermitianTranspose(Bt, MAT_INITIAL_MATRIX, &trans[i * nest->nc + j])); 1817013e2dc7SBarry Smith B = trans[i * nest->nc + j]; 1818013e2dc7SBarry Smith } 181923875855Sstefano_zampini } 18209566063dSJacob Faibussowitsch PetscCall(MatGetRowIJ(B, 0, PETSC_FALSE, PETSC_FALSE, &nnr, (const PetscInt **)&nii, (const PetscInt **)&njj, &done)); 182128b400f6SJacob Faibussowitsch PetscCheck(done, PetscObjectComm((PetscObject)B), PETSC_ERR_PLIB, "MatGetRowIJ"); 18229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(B, &naa)); 1823b68353e5Sstefano_zampini nnz += nii[nnr]; 1824b68353e5Sstefano_zampini 1825b68353e5Sstefano_zampini aii[i * nest->nc + j] = nii; 1826b68353e5Sstefano_zampini ajj[i * nest->nc + j] = njj; 1827b68353e5Sstefano_zampini avv[i * nest->nc + j] = naa; 1828b68353e5Sstefano_zampini } 1829b68353e5Sstefano_zampini } 1830b68353e5Sstefano_zampini } 1831b68353e5Sstefano_zampini if (reuse != MAT_REUSE_MATRIX) { 18329566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nr + 1, &ii)); 18339566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &jj)); 18349566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &vv)); 1835b68353e5Sstefano_zampini } else { 183608401ef6SPierre Jolivet PetscCheck(nnz == ii[nr], PetscObjectComm((PetscObject)A), PETSC_ERR_USER, "Cannot reuse matrix, wrong number of nonzeros"); 1837b68353e5Sstefano_zampini } 1838b68353e5Sstefano_zampini 1839b68353e5Sstefano_zampini /* new row pointer */ 18409566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ii, nr + 1)); 1841b68353e5Sstefano_zampini for (i = 0; i < nest->nr; ++i) { 1842b68353e5Sstefano_zampini PetscInt ncr, rst; 1843b68353e5Sstefano_zampini 18449566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(nest->isglobal.row[i], &rst, NULL)); 18459566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(nest->isglobal.row[i], &ncr)); 1846b68353e5Sstefano_zampini for (j = 0; j < nest->nc; ++j) { 1847b68353e5Sstefano_zampini if (aii[i * nest->nc + j]) { 1848b68353e5Sstefano_zampini PetscInt *nii = aii[i * nest->nc + j]; 1849b68353e5Sstefano_zampini PetscInt ir; 1850b68353e5Sstefano_zampini 1851b68353e5Sstefano_zampini for (ir = rst; ir < ncr + rst; ++ir) { 1852b68353e5Sstefano_zampini ii[ir + 1] += nii[1] - nii[0]; 1853b68353e5Sstefano_zampini nii++; 1854b68353e5Sstefano_zampini } 1855b68353e5Sstefano_zampini } 1856b68353e5Sstefano_zampini } 1857b68353e5Sstefano_zampini } 1858b68353e5Sstefano_zampini for (i = 0; i < nr; i++) ii[i + 1] += ii[i]; 1859b68353e5Sstefano_zampini 1860b68353e5Sstefano_zampini /* construct CSR for the new matrix */ 18619566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nr, &ci)); 1862b68353e5Sstefano_zampini for (i = 0; i < nest->nr; ++i) { 1863b68353e5Sstefano_zampini PetscInt ncr, rst; 1864b68353e5Sstefano_zampini 18659566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(nest->isglobal.row[i], &rst, NULL)); 18669566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(nest->isglobal.row[i], &ncr)); 1867b68353e5Sstefano_zampini for (j = 0; j < nest->nc; ++j) { 1868b68353e5Sstefano_zampini if (aii[i * nest->nc + j]) { 1869b68353e5Sstefano_zampini PetscScalar *nvv = avv[i * nest->nc + j]; 1870b68353e5Sstefano_zampini PetscInt *nii = aii[i * nest->nc + j]; 1871b68353e5Sstefano_zampini PetscInt *njj = ajj[i * nest->nc + j]; 1872b68353e5Sstefano_zampini PetscInt ir, cst; 1873b68353e5Sstefano_zampini 18749566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(nest->isglobal.col[j], &cst, NULL)); 1875b68353e5Sstefano_zampini for (ir = rst; ir < ncr + rst; ++ir) { 1876b68353e5Sstefano_zampini PetscInt ij, rsize = nii[1] - nii[0], ist = ii[ir] + ci[ir]; 1877b68353e5Sstefano_zampini 1878b68353e5Sstefano_zampini for (ij = 0; ij < rsize; ij++) { 1879b68353e5Sstefano_zampini jj[ist + ij] = *njj + cst; 1880b68353e5Sstefano_zampini vv[ist + ij] = *nvv; 1881b68353e5Sstefano_zampini njj++; 1882b68353e5Sstefano_zampini nvv++; 1883b68353e5Sstefano_zampini } 1884b68353e5Sstefano_zampini ci[ir] += rsize; 1885b68353e5Sstefano_zampini nii++; 1886b68353e5Sstefano_zampini } 1887b68353e5Sstefano_zampini } 1888b68353e5Sstefano_zampini } 1889b68353e5Sstefano_zampini } 18909566063dSJacob Faibussowitsch PetscCall(PetscFree(ci)); 1891b68353e5Sstefano_zampini 1892b68353e5Sstefano_zampini /* restore info */ 1893b68353e5Sstefano_zampini for (i = 0; i < nest->nr; ++i) { 1894b68353e5Sstefano_zampini for (j = 0; j < nest->nc; ++j) { 1895b68353e5Sstefano_zampini Mat B = nest->m[i][j]; 1896b68353e5Sstefano_zampini if (B) { 1897b68353e5Sstefano_zampini PetscInt nnr = 0, k = i * nest->nc + j; 189823875855Sstefano_zampini 189923875855Sstefano_zampini B = (trans[k] ? trans[k] : B); 19009566063dSJacob Faibussowitsch PetscCall(MatRestoreRowIJ(B, 0, PETSC_FALSE, PETSC_FALSE, &nnr, (const PetscInt **)&aii[k], (const PetscInt **)&ajj[k], &done)); 190128b400f6SJacob Faibussowitsch PetscCheck(done, PetscObjectComm((PetscObject)B), PETSC_ERR_PLIB, "MatRestoreRowIJ"); 19029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(B, &avv[k])); 19039566063dSJacob Faibussowitsch PetscCall(MatDestroy(&trans[k])); 1904b68353e5Sstefano_zampini } 1905b68353e5Sstefano_zampini } 1906b68353e5Sstefano_zampini } 19079566063dSJacob Faibussowitsch PetscCall(PetscFree4(aii, ajj, avv, trans)); 1908b68353e5Sstefano_zampini 1909b68353e5Sstefano_zampini /* finalize newmat */ 1910b68353e5Sstefano_zampini if (reuse == MAT_INITIAL_MATRIX) { 19119566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A), nr, nc, ii, jj, vv, newmat)); 1912b68353e5Sstefano_zampini } else if (reuse == MAT_INPLACE_MATRIX) { 1913b68353e5Sstefano_zampini Mat B; 1914b68353e5Sstefano_zampini 19159566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A), nr, nc, ii, jj, vv, &B)); 19169566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A, &B)); 1917b68353e5Sstefano_zampini } 19189566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*newmat, MAT_FINAL_ASSEMBLY)); 19199566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*newmat, MAT_FINAL_ASSEMBLY)); 1920b68353e5Sstefano_zampini { 1921b68353e5Sstefano_zampini Mat_SeqAIJ *a = (Mat_SeqAIJ *)((*newmat)->data); 1922b68353e5Sstefano_zampini a->free_a = PETSC_TRUE; 1923b68353e5Sstefano_zampini a->free_ij = PETSC_TRUE; 1924b68353e5Sstefano_zampini } 19253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1926b68353e5Sstefano_zampini } 1927b68353e5Sstefano_zampini 1928d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatAXPY_Dense_Nest(Mat Y, PetscScalar a, Mat X) 1929d71ae5a4SJacob Faibussowitsch { 1930be705e3aSPierre Jolivet Mat_Nest *nest = (Mat_Nest *)X->data; 1931be705e3aSPierre Jolivet PetscInt i, j, k, rstart; 1932be705e3aSPierre Jolivet PetscBool flg; 1933be705e3aSPierre Jolivet 1934be705e3aSPierre Jolivet PetscFunctionBegin; 1935be705e3aSPierre Jolivet /* Fill by row */ 1936be705e3aSPierre Jolivet for (j = 0; j < nest->nc; ++j) { 1937be705e3aSPierre Jolivet /* Using global column indices and ISAllGather() is not scalable. */ 1938be705e3aSPierre Jolivet IS bNis; 1939be705e3aSPierre Jolivet PetscInt bN; 1940be705e3aSPierre Jolivet const PetscInt *bNindices; 19419566063dSJacob Faibussowitsch PetscCall(ISAllGather(nest->isglobal.col[j], &bNis)); 19429566063dSJacob Faibussowitsch PetscCall(ISGetSize(bNis, &bN)); 19439566063dSJacob Faibussowitsch PetscCall(ISGetIndices(bNis, &bNindices)); 1944be705e3aSPierre Jolivet for (i = 0; i < nest->nr; ++i) { 1945fd8a7442SPierre Jolivet Mat B = nest->m[i][j], D = NULL; 1946be705e3aSPierre Jolivet PetscInt bm, br; 1947be705e3aSPierre Jolivet const PetscInt *bmindices; 1948be705e3aSPierre Jolivet if (!B) continue; 1949013e2dc7SBarry Smith PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &flg, MATTRANSPOSEVIRTUAL, MATHERMITIANTRANSPOSEVIRTUAL, "")); 1950be705e3aSPierre Jolivet if (flg) { 1951cac4c232SBarry Smith PetscTryMethod(B, "MatTransposeGetMat_C", (Mat, Mat *), (B, &D)); 1952cac4c232SBarry Smith PetscTryMethod(B, "MatHermitianTransposeGetMat_C", (Mat, Mat *), (B, &D)); 19539566063dSJacob Faibussowitsch PetscCall(MatConvert(B, ((PetscObject)D)->type_name, MAT_INITIAL_MATRIX, &D)); 1954be705e3aSPierre Jolivet B = D; 1955be705e3aSPierre Jolivet } 19569566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &flg, MATSEQSBAIJ, MATMPISBAIJ, "")); 1957be705e3aSPierre Jolivet if (flg) { 1958fd8a7442SPierre Jolivet if (D) PetscCall(MatConvert(D, MATBAIJ, MAT_INPLACE_MATRIX, &D)); 1959fd8a7442SPierre Jolivet else PetscCall(MatConvert(B, MATBAIJ, MAT_INITIAL_MATRIX, &D)); 1960be705e3aSPierre Jolivet B = D; 1961be705e3aSPierre Jolivet } 19629566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(nest->isglobal.row[i], &bm)); 19639566063dSJacob Faibussowitsch PetscCall(ISGetIndices(nest->isglobal.row[i], &bmindices)); 19649566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(B, &rstart, NULL)); 1965be705e3aSPierre Jolivet for (br = 0; br < bm; ++br) { 1966be705e3aSPierre Jolivet PetscInt row = bmindices[br], brncols, *cols; 1967be705e3aSPierre Jolivet const PetscInt *brcols; 1968be705e3aSPierre Jolivet const PetscScalar *brcoldata; 1969be705e3aSPierre Jolivet PetscScalar *vals = NULL; 19709566063dSJacob Faibussowitsch PetscCall(MatGetRow(B, br + rstart, &brncols, &brcols, &brcoldata)); 19719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(brncols, &cols)); 1972be705e3aSPierre Jolivet for (k = 0; k < brncols; k++) cols[k] = bNindices[brcols[k]]; 1973be705e3aSPierre Jolivet /* 1974be705e3aSPierre Jolivet Nest blocks are required to be nonoverlapping -- otherwise nest and monolithic index layouts wouldn't match. 1975be705e3aSPierre Jolivet Thus, we could use INSERT_VALUES, but I prefer ADD_VALUES. 1976be705e3aSPierre Jolivet */ 1977be705e3aSPierre Jolivet if (a != 1.0) { 19789566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(brncols, &vals)); 1979be705e3aSPierre Jolivet for (k = 0; k < brncols; k++) vals[k] = a * brcoldata[k]; 19809566063dSJacob Faibussowitsch PetscCall(MatSetValues(Y, 1, &row, brncols, cols, vals, ADD_VALUES)); 19819566063dSJacob Faibussowitsch PetscCall(PetscFree(vals)); 1982be705e3aSPierre Jolivet } else { 19839566063dSJacob Faibussowitsch PetscCall(MatSetValues(Y, 1, &row, brncols, cols, brcoldata, ADD_VALUES)); 1984be705e3aSPierre Jolivet } 19859566063dSJacob Faibussowitsch PetscCall(MatRestoreRow(B, br + rstart, &brncols, &brcols, &brcoldata)); 19869566063dSJacob Faibussowitsch PetscCall(PetscFree(cols)); 1987be705e3aSPierre Jolivet } 1988fd8a7442SPierre Jolivet if (D) PetscCall(MatDestroy(&D)); 19899566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(nest->isglobal.row[i], &bmindices)); 1990be705e3aSPierre Jolivet } 19919566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(bNis, &bNindices)); 19929566063dSJacob Faibussowitsch PetscCall(ISDestroy(&bNis)); 1993be705e3aSPierre Jolivet } 19949566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(Y, MAT_FINAL_ASSEMBLY)); 19959566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(Y, MAT_FINAL_ASSEMBLY)); 19963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1997be705e3aSPierre Jolivet } 1998be705e3aSPierre Jolivet 199966976f2fSJacob Faibussowitsch static PetscErrorCode MatConvert_Nest_AIJ(Mat A, MatType newtype, MatReuse reuse, Mat *newmat) 2000d71ae5a4SJacob Faibussowitsch { 2001629c3df2SDmitry Karpeev Mat_Nest *nest = (Mat_Nest *)A->data; 2002e30678d3SPierre Jolivet PetscInt m, n, M, N, i, j, k, *dnnz, *onnz = NULL, rstart, cstart, cend; 2003b68353e5Sstefano_zampini PetscMPIInt size; 2004629c3df2SDmitry Karpeev Mat C; 2005629c3df2SDmitry Karpeev 2006629c3df2SDmitry Karpeev PetscFunctionBegin; 20079566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)A), &size)); 2008b68353e5Sstefano_zampini if (size == 1) { /* look for a special case with SeqAIJ matrices and strided-1, contiguous, blocks */ 2009b68353e5Sstefano_zampini PetscInt nf; 2010b68353e5Sstefano_zampini PetscBool fast; 2011b68353e5Sstefano_zampini 20129566063dSJacob Faibussowitsch PetscCall(PetscStrcmp(newtype, MATAIJ, &fast)); 201348a46eb9SPierre Jolivet if (!fast) PetscCall(PetscStrcmp(newtype, MATSEQAIJ, &fast)); 2014b68353e5Sstefano_zampini for (i = 0; i < nest->nr && fast; ++i) { 2015b68353e5Sstefano_zampini for (j = 0; j < nest->nc && fast; ++j) { 2016b68353e5Sstefano_zampini Mat B = nest->m[i][j]; 2017b68353e5Sstefano_zampini if (B) { 20189566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &fast)); 201923875855Sstefano_zampini if (!fast) { 202023875855Sstefano_zampini PetscBool istrans; 202123875855Sstefano_zampini 2022013e2dc7SBarry Smith PetscCall(PetscObjectTypeCompare((PetscObject)B, MATTRANSPOSEVIRTUAL, &istrans)); 202323875855Sstefano_zampini if (istrans) { 202423875855Sstefano_zampini Mat Bt; 202523875855Sstefano_zampini 20269566063dSJacob Faibussowitsch PetscCall(MatTransposeGetMat(B, &Bt)); 20279566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)Bt, MATSEQAIJ, &fast)); 2028013e2dc7SBarry Smith } else { 2029013e2dc7SBarry Smith PetscCall(PetscObjectTypeCompare((PetscObject)B, MATHERMITIANTRANSPOSEVIRTUAL, &istrans)); 2030013e2dc7SBarry Smith if (istrans) { 2031013e2dc7SBarry Smith Mat Bt; 2032013e2dc7SBarry Smith 2033013e2dc7SBarry Smith PetscCall(MatHermitianTransposeGetMat(B, &Bt)); 2034013e2dc7SBarry Smith PetscCall(PetscObjectTypeCompare((PetscObject)Bt, MATSEQAIJ, &fast)); 2035013e2dc7SBarry Smith } 203623875855Sstefano_zampini } 2037b68353e5Sstefano_zampini } 2038b68353e5Sstefano_zampini } 2039b68353e5Sstefano_zampini } 2040b68353e5Sstefano_zampini } 2041b68353e5Sstefano_zampini for (i = 0, nf = 0; i < nest->nr && fast; ++i) { 20429566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)nest->isglobal.row[i], ISSTRIDE, &fast)); 2043b68353e5Sstefano_zampini if (fast) { 2044b68353e5Sstefano_zampini PetscInt f, s; 2045b68353e5Sstefano_zampini 20469566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(nest->isglobal.row[i], &f, &s)); 20479371c9d4SSatish Balay if (f != nf || s != 1) { 20489371c9d4SSatish Balay fast = PETSC_FALSE; 20499371c9d4SSatish Balay } else { 20509566063dSJacob Faibussowitsch PetscCall(ISGetSize(nest->isglobal.row[i], &f)); 2051b68353e5Sstefano_zampini nf += f; 2052b68353e5Sstefano_zampini } 2053b68353e5Sstefano_zampini } 2054b68353e5Sstefano_zampini } 2055b68353e5Sstefano_zampini for (i = 0, nf = 0; i < nest->nc && fast; ++i) { 20569566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)nest->isglobal.col[i], ISSTRIDE, &fast)); 2057b68353e5Sstefano_zampini if (fast) { 2058b68353e5Sstefano_zampini PetscInt f, s; 2059b68353e5Sstefano_zampini 20609566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(nest->isglobal.col[i], &f, &s)); 20619371c9d4SSatish Balay if (f != nf || s != 1) { 20629371c9d4SSatish Balay fast = PETSC_FALSE; 20639371c9d4SSatish Balay } else { 20649566063dSJacob Faibussowitsch PetscCall(ISGetSize(nest->isglobal.col[i], &f)); 2065b68353e5Sstefano_zampini nf += f; 2066b68353e5Sstefano_zampini } 2067b68353e5Sstefano_zampini } 2068b68353e5Sstefano_zampini } 2069b68353e5Sstefano_zampini if (fast) { 20709566063dSJacob Faibussowitsch PetscCall(MatConvert_Nest_SeqAIJ_fast(A, newtype, reuse, newmat)); 20713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2072b68353e5Sstefano_zampini } 2073b68353e5Sstefano_zampini } 20749566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &M, &N)); 20759566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(A, &m, &n)); 20769566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRangeColumn(A, &cstart, &cend)); 2077d1487292SPierre Jolivet if (reuse == MAT_REUSE_MATRIX) C = *newmat; 2078d1487292SPierre Jolivet else { 20799566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 20809566063dSJacob Faibussowitsch PetscCall(MatSetType(C, newtype)); 20819566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, M, N)); 2082629c3df2SDmitry Karpeev } 20839566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(2 * m, &dnnz)); 2084e30678d3SPierre Jolivet if (m) { 2085629c3df2SDmitry Karpeev onnz = dnnz + m; 2086629c3df2SDmitry Karpeev for (k = 0; k < m; k++) { 2087629c3df2SDmitry Karpeev dnnz[k] = 0; 2088629c3df2SDmitry Karpeev onnz[k] = 0; 2089629c3df2SDmitry Karpeev } 2090e30678d3SPierre Jolivet } 2091629c3df2SDmitry Karpeev for (j = 0; j < nest->nc; ++j) { 2092629c3df2SDmitry Karpeev IS bNis; 2093629c3df2SDmitry Karpeev PetscInt bN; 2094629c3df2SDmitry Karpeev const PetscInt *bNindices; 2095fd8a7442SPierre Jolivet PetscBool flg; 2096629c3df2SDmitry Karpeev /* Using global column indices and ISAllGather() is not scalable. */ 20979566063dSJacob Faibussowitsch PetscCall(ISAllGather(nest->isglobal.col[j], &bNis)); 20989566063dSJacob Faibussowitsch PetscCall(ISGetSize(bNis, &bN)); 20999566063dSJacob Faibussowitsch PetscCall(ISGetIndices(bNis, &bNindices)); 2100629c3df2SDmitry Karpeev for (i = 0; i < nest->nr; ++i) { 2101629c3df2SDmitry Karpeev PetscSF bmsf; 2102649b366bSFande Kong PetscSFNode *iremote; 2103fd8a7442SPierre Jolivet Mat B = nest->m[i][j], D = NULL; 2104649b366bSFande Kong PetscInt bm, *sub_dnnz, *sub_onnz, br; 2105629c3df2SDmitry Karpeev const PetscInt *bmindices; 2106629c3df2SDmitry Karpeev if (!B) continue; 21079566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(nest->isglobal.row[i], &bm)); 21089566063dSJacob Faibussowitsch PetscCall(ISGetIndices(nest->isglobal.row[i], &bmindices)); 21099566063dSJacob Faibussowitsch PetscCall(PetscSFCreate(PetscObjectComm((PetscObject)A), &bmsf)); 21109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bm, &iremote)); 21119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bm, &sub_dnnz)); 21129566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bm, &sub_onnz)); 2113649b366bSFande Kong for (k = 0; k < bm; ++k) { 2114649b366bSFande Kong sub_dnnz[k] = 0; 2115649b366bSFande Kong sub_onnz[k] = 0; 2116649b366bSFande Kong } 2117dead4d76SPierre Jolivet PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &flg, MATTRANSPOSEVIRTUAL, MATHERMITIANTRANSPOSEVIRTUAL, "")); 2118fd8a7442SPierre Jolivet if (flg) { 2119fd8a7442SPierre Jolivet PetscTryMethod(B, "MatTransposeGetMat_C", (Mat, Mat *), (B, &D)); 2120fd8a7442SPierre Jolivet PetscTryMethod(B, "MatHermitianTransposeGetMat_C", (Mat, Mat *), (B, &D)); 2121fd8a7442SPierre Jolivet PetscCall(MatConvert(B, ((PetscObject)D)->type_name, MAT_INITIAL_MATRIX, &D)); 2122fd8a7442SPierre Jolivet B = D; 2123fd8a7442SPierre Jolivet } 2124fd8a7442SPierre Jolivet PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &flg, MATSEQSBAIJ, MATMPISBAIJ, "")); 2125fd8a7442SPierre Jolivet if (flg) { 2126fd8a7442SPierre Jolivet if (D) PetscCall(MatConvert(D, MATBAIJ, MAT_INPLACE_MATRIX, &D)); 2127fd8a7442SPierre Jolivet else PetscCall(MatConvert(B, MATBAIJ, MAT_INITIAL_MATRIX, &D)); 2128fd8a7442SPierre Jolivet B = D; 2129fd8a7442SPierre Jolivet } 2130629c3df2SDmitry Karpeev /* 2131629c3df2SDmitry Karpeev Locate the owners for all of the locally-owned global row indices for this row block. 2132629c3df2SDmitry Karpeev These determine the roots of PetscSF used to communicate preallocation data to row owners. 2133629c3df2SDmitry Karpeev The roots correspond to the dnnz and onnz entries; thus, there are two roots per row. 2134629c3df2SDmitry Karpeev */ 21359566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(B, &rstart, NULL)); 2136629c3df2SDmitry Karpeev for (br = 0; br < bm; ++br) { 2137131c27b5Sprj- PetscInt row = bmindices[br], brncols, col; 2138629c3df2SDmitry Karpeev const PetscInt *brcols; 2139a4b3d3acSMatthew G Knepley PetscInt rowrel = 0; /* row's relative index on its owner rank */ 2140131c27b5Sprj- PetscMPIInt rowowner = 0; 21419566063dSJacob Faibussowitsch PetscCall(PetscLayoutFindOwnerIndex(A->rmap, row, &rowowner, &rowrel)); 2142649b366bSFande Kong /* how many roots */ 21439371c9d4SSatish Balay iremote[br].rank = rowowner; 21449371c9d4SSatish Balay iremote[br].index = rowrel; /* edge from bmdnnz to dnnz */ 2145649b366bSFande Kong /* get nonzero pattern */ 21469566063dSJacob Faibussowitsch PetscCall(MatGetRow(B, br + rstart, &brncols, &brcols, NULL)); 2147629c3df2SDmitry Karpeev for (k = 0; k < brncols; k++) { 2148629c3df2SDmitry Karpeev col = bNindices[brcols[k]]; 2149649b366bSFande Kong if (col >= A->cmap->range[rowowner] && col < A->cmap->range[rowowner + 1]) { 2150649b366bSFande Kong sub_dnnz[br]++; 2151649b366bSFande Kong } else { 2152649b366bSFande Kong sub_onnz[br]++; 2153649b366bSFande Kong } 2154629c3df2SDmitry Karpeev } 21559566063dSJacob Faibussowitsch PetscCall(MatRestoreRow(B, br + rstart, &brncols, &brcols, NULL)); 2156629c3df2SDmitry Karpeev } 2157fd8a7442SPierre Jolivet if (D) PetscCall(MatDestroy(&D)); 21589566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(nest->isglobal.row[i], &bmindices)); 2159629c3df2SDmitry Karpeev /* bsf will have to take care of disposing of bedges. */ 21609566063dSJacob Faibussowitsch PetscCall(PetscSFSetGraph(bmsf, m, bm, NULL, PETSC_OWN_POINTER, iremote, PETSC_OWN_POINTER)); 21619566063dSJacob Faibussowitsch PetscCall(PetscSFReduceBegin(bmsf, MPIU_INT, sub_dnnz, dnnz, MPI_SUM)); 21629566063dSJacob Faibussowitsch PetscCall(PetscSFReduceEnd(bmsf, MPIU_INT, sub_dnnz, dnnz, MPI_SUM)); 21639566063dSJacob Faibussowitsch PetscCall(PetscSFReduceBegin(bmsf, MPIU_INT, sub_onnz, onnz, MPI_SUM)); 21649566063dSJacob Faibussowitsch PetscCall(PetscSFReduceEnd(bmsf, MPIU_INT, sub_onnz, onnz, MPI_SUM)); 21659566063dSJacob Faibussowitsch PetscCall(PetscFree(sub_dnnz)); 21669566063dSJacob Faibussowitsch PetscCall(PetscFree(sub_onnz)); 21679566063dSJacob Faibussowitsch PetscCall(PetscSFDestroy(&bmsf)); 2168629c3df2SDmitry Karpeev } 21699566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(bNis, &bNindices)); 21709566063dSJacob Faibussowitsch PetscCall(ISDestroy(&bNis)); 217165a4a0a3Sstefano_zampini } 217265a4a0a3Sstefano_zampini /* Resize preallocation if overestimated */ 217365a4a0a3Sstefano_zampini for (i = 0; i < m; i++) { 217465a4a0a3Sstefano_zampini dnnz[i] = PetscMin(dnnz[i], A->cmap->n); 217565a4a0a3Sstefano_zampini onnz[i] = PetscMin(onnz[i], A->cmap->N - A->cmap->n); 2176629c3df2SDmitry Karpeev } 21779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, dnnz)); 21789566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(C, 0, dnnz, 0, onnz)); 21799566063dSJacob Faibussowitsch PetscCall(PetscFree(dnnz)); 21809566063dSJacob Faibussowitsch PetscCall(MatAXPY_Dense_Nest(C, 1.0, A)); 2181d1487292SPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) { 21829566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A, &C)); 2183d1487292SPierre Jolivet } else *newmat = C; 21843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2185be705e3aSPierre Jolivet } 2186629c3df2SDmitry Karpeev 218766976f2fSJacob Faibussowitsch static PetscErrorCode MatConvert_Nest_Dense(Mat A, MatType newtype, MatReuse reuse, Mat *newmat) 2188d71ae5a4SJacob Faibussowitsch { 2189629c3df2SDmitry Karpeev Mat B; 2190be705e3aSPierre Jolivet PetscInt m, n, M, N; 2191be705e3aSPierre Jolivet 2192be705e3aSPierre Jolivet PetscFunctionBegin; 21939566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &M, &N)); 21949566063dSJacob Faibussowitsch PetscCall(MatGetLocalSize(A, &m, &n)); 2195be705e3aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 2196be705e3aSPierre Jolivet B = *newmat; 21979566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(B)); 2198be705e3aSPierre Jolivet } else { 21999566063dSJacob Faibussowitsch PetscCall(MatCreateDense(PetscObjectComm((PetscObject)A), m, PETSC_DECIDE, M, N, NULL, &B)); 2200629c3df2SDmitry Karpeev } 22019566063dSJacob Faibussowitsch PetscCall(MatAXPY_Dense_Nest(B, 1.0, A)); 2202be705e3aSPierre Jolivet if (reuse == MAT_INPLACE_MATRIX) { 22039566063dSJacob Faibussowitsch PetscCall(MatHeaderReplace(A, &B)); 2204be705e3aSPierre Jolivet } else if (reuse == MAT_INITIAL_MATRIX) *newmat = B; 22053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2206629c3df2SDmitry Karpeev } 2207629c3df2SDmitry Karpeev 220866976f2fSJacob Faibussowitsch static PetscErrorCode MatHasOperation_Nest(Mat mat, MatOperation op, PetscBool *has) 2209d71ae5a4SJacob Faibussowitsch { 22108b7d3b4bSBarry Smith Mat_Nest *bA = (Mat_Nest *)mat->data; 22113c6db4c4SPierre Jolivet MatOperation opAdd; 22128b7d3b4bSBarry Smith PetscInt i, j, nr = bA->nr, nc = bA->nc; 22138b7d3b4bSBarry Smith PetscBool flg; 22148b7d3b4bSBarry Smith 22154d86920dSPierre Jolivet PetscFunctionBegin; 221652c5f739Sprj- *has = PETSC_FALSE; 22173c6db4c4SPierre Jolivet if (op == MATOP_MULT || op == MATOP_MULT_ADD || op == MATOP_MULT_TRANSPOSE || op == MATOP_MULT_TRANSPOSE_ADD) { 22183c6db4c4SPierre Jolivet opAdd = (op == MATOP_MULT || op == MATOP_MULT_ADD ? MATOP_MULT_ADD : MATOP_MULT_TRANSPOSE_ADD); 22198b7d3b4bSBarry Smith for (j = 0; j < nc; j++) { 22208b7d3b4bSBarry Smith for (i = 0; i < nr; i++) { 22218b7d3b4bSBarry Smith if (!bA->m[i][j]) continue; 22229566063dSJacob Faibussowitsch PetscCall(MatHasOperation(bA->m[i][j], opAdd, &flg)); 22233ba16761SJacob Faibussowitsch if (!flg) PetscFunctionReturn(PETSC_SUCCESS); 22248b7d3b4bSBarry Smith } 22258b7d3b4bSBarry Smith } 22268b7d3b4bSBarry Smith } 22273c6db4c4SPierre Jolivet if (((void **)mat->ops)[op]) *has = PETSC_TRUE; 22283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22298b7d3b4bSBarry Smith } 22308b7d3b4bSBarry Smith 2231659c6bb0SJed Brown /*MC 22322ef1f0ffSBarry Smith MATNEST - "nest" - Matrix type consisting of nested submatrices, each stored separately. 2233659c6bb0SJed Brown 2234659c6bb0SJed Brown Level: intermediate 2235659c6bb0SJed Brown 2236659c6bb0SJed Brown Notes: 223711a5261eSBarry Smith This matrix type permits scalable use of `PCFIELDSPLIT` and avoids the large memory costs of extracting submatrices. 2238659c6bb0SJed Brown It allows the use of symmetric and block formats for parts of multi-physics simulations. 223911a5261eSBarry Smith It is usually used with `DMCOMPOSITE` and `DMCreateMatrix()` 2240659c6bb0SJed Brown 22418b7d3b4bSBarry Smith Each of the submatrices lives on the same MPI communicator as the original nest matrix (though they can have zero 22428b7d3b4bSBarry Smith rows/columns on some processes.) Thus this is not meant for cases where the submatrices live on far fewer processes 22438b7d3b4bSBarry Smith than the nest matrix. 22448b7d3b4bSBarry Smith 22451cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATNEST`, `MatCreate()`, `MatType`, `MatCreateNest()`, `MatNestSetSubMat()`, `MatNestGetSubMat()`, 2246db781477SPatrick Sanan `VecCreateNest()`, `DMCreateMatrix()`, `DMCOMPOSITE`, `MatNestSetVecType()`, `MatNestGetLocalISs()`, 2247db781477SPatrick Sanan `MatNestGetISs()`, `MatNestSetSubMats()`, `MatNestGetSubMats()` 2248659c6bb0SJed Brown M*/ 2249d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_Nest(Mat A) 2250d71ae5a4SJacob Faibussowitsch { 2251c8883902SJed Brown Mat_Nest *s; 2252c8883902SJed Brown 2253c8883902SJed Brown PetscFunctionBegin; 22544dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&s)); 2255c8883902SJed Brown A->data = (void *)s; 2256e7c19651SJed Brown 2257e7c19651SJed Brown s->nr = -1; 2258e7c19651SJed Brown s->nc = -1; 22590298fd71SBarry Smith s->m = NULL; 2260e7c19651SJed Brown s->splitassembly = PETSC_FALSE; 2261c8883902SJed Brown 22629566063dSJacob Faibussowitsch PetscCall(PetscMemzero(A->ops, sizeof(*A->ops))); 226326fbe8dcSKarl Rupp 2264c8883902SJed Brown A->ops->mult = MatMult_Nest; 22659194d70fSJed Brown A->ops->multadd = MatMultAdd_Nest; 2266c8883902SJed Brown A->ops->multtranspose = MatMultTranspose_Nest; 22679194d70fSJed Brown A->ops->multtransposeadd = MatMultTransposeAdd_Nest; 2268f8170845SAlex Fikl A->ops->transpose = MatTranspose_Nest; 22690998551bSBlanca Mellado Pinto A->ops->multhermitiantranspose = MatMultHermitianTranspose_Nest; 22700998551bSBlanca Mellado Pinto A->ops->multhermitiantransposeadd = MatMultHermitianTransposeAdd_Nest; 2271c8883902SJed Brown A->ops->assemblybegin = MatAssemblyBegin_Nest; 2272c8883902SJed Brown A->ops->assemblyend = MatAssemblyEnd_Nest; 2273c8883902SJed Brown A->ops->zeroentries = MatZeroEntries_Nest; 2274c222c20dSDavid Ham A->ops->copy = MatCopy_Nest; 22756e76ffeaSPierre Jolivet A->ops->axpy = MatAXPY_Nest; 2276c8883902SJed Brown A->ops->duplicate = MatDuplicate_Nest; 22777dae84e0SHong Zhang A->ops->createsubmatrix = MatCreateSubMatrix_Nest; 2278c8883902SJed Brown A->ops->destroy = MatDestroy_Nest; 2279c8883902SJed Brown A->ops->view = MatView_Nest; 2280f4259b30SLisandro Dalcin A->ops->getvecs = NULL; /* Use VECNEST by calling MatNestSetVecType(A,VECNEST) */ 2281c8883902SJed Brown A->ops->getlocalsubmatrix = MatGetLocalSubMatrix_Nest; 2282c8883902SJed Brown A->ops->restorelocalsubmatrix = MatRestoreLocalSubMatrix_Nest; 2283429bac76SJed Brown A->ops->getdiagonal = MatGetDiagonal_Nest; 2284429bac76SJed Brown A->ops->diagonalscale = MatDiagonalScale_Nest; 2285a061e289SJed Brown A->ops->scale = MatScale_Nest; 2286a061e289SJed Brown A->ops->shift = MatShift_Nest; 228713135bc6SAlex Fikl A->ops->diagonalset = MatDiagonalSet_Nest; 2288f8170845SAlex Fikl A->ops->setrandom = MatSetRandom_Nest; 22898b7d3b4bSBarry Smith A->ops->hasoperation = MatHasOperation_Nest; 2290381b8e50SStefano Zampini A->ops->missingdiagonal = MatMissingDiagonal_Nest; 2291c8883902SJed Brown 2292f4259b30SLisandro Dalcin A->spptr = NULL; 2293c8883902SJed Brown A->assembled = PETSC_FALSE; 2294c8883902SJed Brown 2295c8883902SJed Brown /* expose Nest api's */ 22969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetSubMat_C", MatNestGetSubMat_Nest)); 22979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestSetSubMat_C", MatNestSetSubMat_Nest)); 22989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetSubMats_C", MatNestGetSubMats_Nest)); 22999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetSize_C", MatNestGetSize_Nest)); 23009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetISs_C", MatNestGetISs_Nest)); 23019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestGetLocalISs_C", MatNestGetLocalISs_Nest)); 23029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestSetVecType_C", MatNestSetVecType_Nest)); 23039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatNestSetSubMats_C", MatNestSetSubMats_Nest)); 23049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_mpiaij_C", MatConvert_Nest_AIJ)); 23059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_seqaij_C", MatConvert_Nest_AIJ)); 23069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_aij_C", MatConvert_Nest_AIJ)); 23079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_is_C", MatConvert_Nest_IS)); 23089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_mpidense_C", MatConvert_Nest_Dense)); 23099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_nest_seqdense_C", MatConvert_Nest_Dense)); 23109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_nest_seqdense_C", MatProductSetFromOptions_Nest_Dense)); 23119566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_nest_mpidense_C", MatProductSetFromOptions_Nest_Dense)); 2312c8883902SJed Brown 23139566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, MATNEST)); 23143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2315c8883902SJed Brown } 2316