1c4762a1bSJed Brown 2c4762a1bSJed Brown static char help[] = "Extract submatrices using unsorted indices. For SEQSBAIJ either sort both rows and columns, or sort none.\n\n"; 3c4762a1bSJed Brown /* 4c4762a1bSJed Brown Take a 4x4 grid and form a 5-point stencil graph Laplacian over it. 5c4762a1bSJed Brown Partition the grid into two subdomains by splitting into two in the j-direction (slowest varying). 6c4762a1bSJed Brown Impose an overlap of 1 and order the subdomains with the j-direction varying fastest. 7c4762a1bSJed Brown Extract the subdomain submatrices, one per rank. 8c4762a1bSJed Brown */ 9c4762a1bSJed Brown /* Results: 10c4762a1bSJed Brown Sequential: 11c4762a1bSJed Brown - seqaij: will error out, if rows or columns are unsorted 12c4762a1bSJed Brown - seqbaij: will extract submatrices correctly even for unsorted row or column indices 13c4762a1bSJed Brown - seqsbaij: will extract submatrices correctly even for unsorted row and column indices (both must be sorted or not); 14c4762a1bSJed Brown CANNOT automatically report inversions, because MatGetRow is not available. 15c4762a1bSJed Brown MPI: 16c4762a1bSJed Brown - mpiaij: will error out, if columns are unsorted 17c4762a1bSJed Brown - mpibaij: will error out, if columns are unsorted. 18c4762a1bSJed Brown - mpisbaij: will error out, if columns are unsorted; even with unsorted rows will produce correct submatrices; 19c4762a1bSJed Brown CANNOT automatically report inversions, because MatGetRow is not available. 20c4762a1bSJed Brown */ 21c4762a1bSJed Brown 22c4762a1bSJed Brown #include <petscmat.h> 23c4762a1bSJed Brown #include <petscis.h> 24c4762a1bSJed Brown 25*d71ae5a4SJacob Faibussowitsch int main(int argc, char **args) 26*d71ae5a4SJacob Faibussowitsch { 27c4762a1bSJed Brown Mat A, *S; 28c4762a1bSJed Brown IS rowis[2], colis[2]; 29c4762a1bSJed Brown PetscInt n, N, i, j, k, l, nsub, Jlow[2] = {0, 1}, *jlow, Jhigh[2] = {3, 4}, *jhigh, row, col, *subindices, ncols; 30c4762a1bSJed Brown const PetscInt *cols; 31c4762a1bSJed Brown PetscScalar v; 32c4762a1bSJed Brown PetscMPIInt rank, size, p, inversions, total_inversions; 33c4762a1bSJed Brown PetscBool sort_rows, sort_cols, show_inversions; 34c4762a1bSJed Brown 35327415f7SBarry Smith PetscFunctionBeginUser; 369566063dSJacob Faibussowitsch PetscCall(PetscInitialize(&argc, &args, (char *)0, help)); 379566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(PETSC_COMM_WORLD, &rank)); 389566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PETSC_COMM_WORLD, &size)); 39be096a46SBarry Smith PetscCheck(size < 3, PETSC_COMM_WORLD, PETSC_ERR_WRONG_MPI_SIZE, "A uniprocessor or two-processor example only."); 40c4762a1bSJed Brown 419566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_WORLD, &A)); 42c4762a1bSJed Brown if (size > 1) { 439371c9d4SSatish Balay n = 8; 449371c9d4SSatish Balay N = 16; 45c4762a1bSJed Brown } else { 469371c9d4SSatish Balay n = 16; 479371c9d4SSatish Balay N = 16; 48c4762a1bSJed Brown } 499566063dSJacob Faibussowitsch PetscCall(MatSetSizes(A, n, n, N, N)); 509566063dSJacob Faibussowitsch PetscCall(MatSetFromOptions(A)); 519566063dSJacob Faibussowitsch PetscCall(MatSetUp(A)); 52c4762a1bSJed Brown 53c4762a1bSJed Brown /* Don't care if the entries are set multiple times by different procs. */ 54c4762a1bSJed Brown for (i = 0; i < 4; ++i) { 55c4762a1bSJed Brown for (j = 0; j < 4; ++j) { 56c4762a1bSJed Brown row = j * 4 + i; 57c4762a1bSJed Brown v = -1.0; 58c4762a1bSJed Brown if (i > 0) { 599371c9d4SSatish Balay col = row - 1; 609371c9d4SSatish Balay PetscCall(MatSetValues(A, 1, &row, 1, &col, &v, INSERT_VALUES)); 61c4762a1bSJed Brown } 62c4762a1bSJed Brown if (i < 3) { 639371c9d4SSatish Balay col = row + 1; 649371c9d4SSatish Balay PetscCall(MatSetValues(A, 1, &row, 1, &col, &v, INSERT_VALUES)); 65c4762a1bSJed Brown } 66c4762a1bSJed Brown if (j > 0) { 679371c9d4SSatish Balay col = row - 4; 689371c9d4SSatish Balay PetscCall(MatSetValues(A, 1, &row, 1, &col, &v, INSERT_VALUES)); 69c4762a1bSJed Brown } 70c4762a1bSJed Brown if (j < 3) { 719371c9d4SSatish Balay col = row + 4; 729371c9d4SSatish Balay PetscCall(MatSetValues(A, 1, &row, 1, &col, &v, INSERT_VALUES)); 73c4762a1bSJed Brown } 74c4762a1bSJed Brown v = 4.0; 759566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &row, 1, &row, &v, INSERT_VALUES)); 76c4762a1bSJed Brown } 77c4762a1bSJed Brown } 789566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 799566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 809566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD, "Original matrix\n")); 819566063dSJacob Faibussowitsch PetscCall(MatView(A, PETSC_VIEWER_STDOUT_WORLD)); 82c4762a1bSJed Brown 83c4762a1bSJed Brown if (size > 1) { 84c4762a1bSJed Brown nsub = 1; /* one subdomain per rank */ 859371c9d4SSatish Balay } else { 86c4762a1bSJed Brown nsub = 2; /* both subdomains on rank 0 */ 87c4762a1bSJed Brown } 88c4762a1bSJed Brown if (rank) { 899371c9d4SSatish Balay jlow = Jlow + 1; 909371c9d4SSatish Balay jhigh = Jhigh + 1; 919371c9d4SSatish Balay } else { 929371c9d4SSatish Balay jlow = Jlow; 939371c9d4SSatish Balay jhigh = Jhigh; 94c4762a1bSJed Brown } 95c4762a1bSJed Brown sort_rows = PETSC_FALSE; 969566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(NULL, NULL, "-sort_rows", &sort_rows, NULL)); 97c4762a1bSJed Brown sort_cols = PETSC_FALSE; 989566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(NULL, NULL, "-sort_cols", &sort_cols, NULL)); 99c4762a1bSJed Brown for (l = 0; l < nsub; ++l) { 1009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(12, &subindices)); 101c4762a1bSJed Brown k = 0; 102c4762a1bSJed Brown for (i = 0; i < 4; ++i) { 103c4762a1bSJed Brown for (j = jlow[l]; j < jhigh[l]; ++j) { 104c4762a1bSJed Brown subindices[k] = j * 4 + i; 105c4762a1bSJed Brown k++; 106c4762a1bSJed Brown } 107c4762a1bSJed Brown } 1089566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, 12, subindices, PETSC_OWN_POINTER, rowis + l)); 109c4762a1bSJed Brown if ((sort_rows && !sort_cols) || (!sort_rows && sort_cols)) { 1109566063dSJacob Faibussowitsch PetscCall(ISDuplicate(rowis[l], colis + l)); 111c4762a1bSJed Brown } else { 1129566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)rowis[l])); 113c4762a1bSJed Brown colis[l] = rowis[l]; 114c4762a1bSJed Brown } 11548a46eb9SPierre Jolivet if (sort_rows) PetscCall(ISSort(rowis[l])); 11648a46eb9SPierre Jolivet if (sort_cols) PetscCall(ISSort(colis[l])); 117c4762a1bSJed Brown } 118c4762a1bSJed Brown 1199566063dSJacob Faibussowitsch PetscCall(MatCreateSubMatrices(A, nsub, rowis, colis, MAT_INITIAL_MATRIX, &S)); 120c4762a1bSJed Brown 121c4762a1bSJed Brown show_inversions = PETSC_FALSE; 122c4762a1bSJed Brown 1239566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(NULL, NULL, "-show_inversions", &show_inversions, NULL)); 124c4762a1bSJed Brown 125c4762a1bSJed Brown inversions = 0; 126c4762a1bSJed Brown for (p = 0; p < size; ++p) { 127c4762a1bSJed Brown if (p == rank) { 1289566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "[%" PetscInt_FMT ":%" PetscInt_FMT "]: Number of subdomains: %" PetscInt_FMT ":\n", rank, size, nsub)); 129c4762a1bSJed Brown for (l = 0; l < nsub; ++l) { 130c4762a1bSJed Brown PetscInt i0, i1; 1319566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "[%" PetscInt_FMT ":%" PetscInt_FMT "]: Subdomain row IS %" PetscInt_FMT ":\n", rank, size, l)); 1329566063dSJacob Faibussowitsch PetscCall(ISView(rowis[l], PETSC_VIEWER_STDOUT_SELF)); 1339566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "[%" PetscInt_FMT ":%" PetscInt_FMT "]: Subdomain col IS %" PetscInt_FMT ":\n", rank, size, l)); 1349566063dSJacob Faibussowitsch PetscCall(ISView(colis[l], PETSC_VIEWER_STDOUT_SELF)); 1359566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "[%" PetscInt_FMT ":%" PetscInt_FMT "]: Submatrix %" PetscInt_FMT ":\n", rank, size, l)); 1369566063dSJacob Faibussowitsch PetscCall(MatView(S[l], PETSC_VIEWER_STDOUT_SELF)); 137c4762a1bSJed Brown if (show_inversions) { 1389566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(S[l], &i0, &i1)); 139c4762a1bSJed Brown for (i = i0; i < i1; ++i) { 1409566063dSJacob Faibussowitsch PetscCall(MatGetRow(S[l], i, &ncols, &cols, NULL)); 141c4762a1bSJed Brown for (j = 1; j < ncols; ++j) { 142c4762a1bSJed Brown if (cols[j] < cols[j - 1]) { 1439566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "***Inversion in row %" PetscInt_FMT ": col[%" PetscInt_FMT "] = %" PetscInt_FMT " < %" PetscInt_FMT " = col[%" PetscInt_FMT "]\n", i, j, cols[j], cols[j - 1], j - 1)); 144c4762a1bSJed Brown inversions++; 145c4762a1bSJed Brown } 146c4762a1bSJed Brown } 1479566063dSJacob Faibussowitsch PetscCall(MatRestoreRow(S[l], i, &ncols, &cols, NULL)); 148c4762a1bSJed Brown } 149c4762a1bSJed Brown } 150c4762a1bSJed Brown } 151c4762a1bSJed Brown } 1529566063dSJacob Faibussowitsch PetscCallMPI(MPI_Barrier(PETSC_COMM_WORLD)); 153c4762a1bSJed Brown } 154c4762a1bSJed Brown if (show_inversions) { 1559566063dSJacob Faibussowitsch PetscCallMPI(MPI_Reduce(&inversions, &total_inversions, 1, MPIU_INT, MPI_SUM, 0, PETSC_COMM_WORLD)); 1569566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD, "*Total inversions: %" PetscInt_FMT "\n", total_inversions)); 157c4762a1bSJed Brown } 1589566063dSJacob Faibussowitsch PetscCall(MatDestroy(&A)); 159c4762a1bSJed Brown 160c4762a1bSJed Brown for (l = 0; l < nsub; ++l) { 1619566063dSJacob Faibussowitsch PetscCall(ISDestroy(&(rowis[l]))); 1629566063dSJacob Faibussowitsch PetscCall(ISDestroy(&(colis[l]))); 163c4762a1bSJed Brown } 1649566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices(nsub, &S)); 1659566063dSJacob Faibussowitsch PetscCall(PetscFinalize()); 166b122ec5aSJacob Faibussowitsch return 0; 167c4762a1bSJed Brown } 168