1c4762a1bSJed Brown 2c4762a1bSJed Brown static char help[] = "Tests MatIncreaseOverlap(), MatCreateSubMatrices() for parallel AIJ and BAIJ formats.\n"; 3c4762a1bSJed Brown 4c4762a1bSJed Brown #include <petscmat.h> 5c4762a1bSJed Brown 6d71ae5a4SJacob Faibussowitsch int main(int argc, char **args) 7d71ae5a4SJacob Faibussowitsch { 8*5a2b941aSBarry Smith Mat E, A, B, Bt, *submatA, *submatB; 9c4762a1bSJed Brown PetscInt bs = 1, m = 11, ov = 1, i, j, k, *rows, *cols, nd = 5, *idx, rstart, rend, sz, mm, nn, M, N, Mbs; 10c4762a1bSJed Brown PetscMPIInt size, rank; 11c4762a1bSJed Brown PetscScalar *vals, rval; 12c4762a1bSJed Brown IS *is1, *is2; 13c4762a1bSJed Brown PetscRandom rdm; 14c4762a1bSJed Brown Vec xx, s1, s2; 15c4762a1bSJed Brown PetscReal s1norm, s2norm, rnorm, tol = 100 * PETSC_SMALL; 1682b5ce2aSStefano Zampini PetscBool flg, test_nd0 = PETSC_FALSE, emptynd; 17c4762a1bSJed Brown 18327415f7SBarry Smith PetscFunctionBeginUser; 199566063dSJacob Faibussowitsch PetscCall(PetscInitialize(&argc, &args, (char *)0, help)); 209566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PETSC_COMM_WORLD, &size)); 219566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(PETSC_COMM_WORLD, &rank)); 22c4762a1bSJed Brown 239566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetInt(NULL, NULL, "-mat_block_size", &bs, NULL)); 249566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetInt(NULL, NULL, "-mat_size", &m, NULL)); 259566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetInt(NULL, NULL, "-ov", &ov, NULL)); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetInt(NULL, NULL, "-nd", &nd, NULL)); 279566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(NULL, NULL, "-test_nd0", &test_nd0, NULL)); 28c4762a1bSJed Brown 29c4762a1bSJed Brown /* Create a AIJ matrix A */ 309566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_WORLD, &A)); 319566063dSJacob Faibussowitsch PetscCall(MatSetSizes(A, m * bs, m * bs, PETSC_DECIDE, PETSC_DECIDE)); 329566063dSJacob Faibussowitsch PetscCall(MatSetType(A, MATAIJ)); 334b5966ddSBarry Smith PetscCall(MatSetBlockSize(A, bs)); 349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, PETSC_DEFAULT, NULL)); 359566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(A, PETSC_DEFAULT, NULL, PETSC_DEFAULT, NULL)); 369566063dSJacob Faibussowitsch PetscCall(MatSetFromOptions(A)); 379566063dSJacob Faibussowitsch PetscCall(MatSetOption(A, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_FALSE)); 38c4762a1bSJed Brown 39c4762a1bSJed Brown /* Create a BAIJ matrix B */ 409566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_WORLD, &B)); 419566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, m * bs, m * bs, PETSC_DECIDE, PETSC_DECIDE)); 429566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATBAIJ)); 439566063dSJacob Faibussowitsch PetscCall(MatSeqBAIJSetPreallocation(B, bs, PETSC_DEFAULT, NULL)); 449566063dSJacob Faibussowitsch PetscCall(MatMPIBAIJSetPreallocation(B, bs, PETSC_DEFAULT, NULL, PETSC_DEFAULT, NULL)); 459566063dSJacob Faibussowitsch PetscCall(MatSetFromOptions(B)); 469566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_FALSE)); 47c4762a1bSJed Brown 489566063dSJacob Faibussowitsch PetscCall(PetscRandomCreate(PETSC_COMM_WORLD, &rdm)); 499566063dSJacob Faibussowitsch PetscCall(PetscRandomSetFromOptions(rdm)); 50c4762a1bSJed Brown 519566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(A, &rstart, &rend)); 529566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &M, &N)); 53c4762a1bSJed Brown Mbs = M / bs; 54c4762a1bSJed Brown 559566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs, &rows)); 569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs, &cols)); 579566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs * bs, &vals)); 589566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &idx)); 59c4762a1bSJed Brown 60c4762a1bSJed Brown /* Now set blocks of values */ 61c4762a1bSJed Brown for (i = 0; i < 40 * bs; i++) { 624b5966ddSBarry Smith PetscInt nr = 1, nc = 1; 639566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rdm, &rval)); 64c4762a1bSJed Brown cols[0] = bs * (int)(PetscRealPart(rval) * Mbs); 659566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rdm, &rval)); 66c4762a1bSJed Brown rows[0] = rstart + bs * (int)(PetscRealPart(rval) * m); 67c4762a1bSJed Brown for (j = 1; j < bs; j++) { 684b5966ddSBarry Smith PetscCall(PetscRandomGetValue(rdm, &rval)); 694b5966ddSBarry Smith if (PetscRealPart(rval) > .5) rows[nr++] = rows[0] + j - 1; 704b5966ddSBarry Smith } 714b5966ddSBarry Smith for (j = 1; j < bs; j++) { 724b5966ddSBarry Smith PetscCall(PetscRandomGetValue(rdm, &rval)); 734b5966ddSBarry Smith if (PetscRealPart(rval) > .5) cols[nc++] = cols[0] + j - 1; 74c4762a1bSJed Brown } 75c4762a1bSJed Brown 764b5966ddSBarry Smith for (j = 0; j < nr * nc; j++) { 779566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rdm, &rval)); 78c4762a1bSJed Brown vals[j] = rval; 79c4762a1bSJed Brown } 804b5966ddSBarry Smith PetscCall(MatSetValues(A, nr, rows, nc, cols, vals, ADD_VALUES)); 814b5966ddSBarry Smith PetscCall(MatSetValues(B, nr, rows, nc, cols, vals, ADD_VALUES)); 82c4762a1bSJed Brown } 839566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 849566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 859566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 869566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 87c4762a1bSJed Brown 88*5a2b941aSBarry Smith /* Test MatConvert_MPIAIJ_MPI(S)BAIJ handles incompletely filled blocks */ 894b5966ddSBarry Smith PetscCall(MatConvert(A, MATBAIJ, MAT_INITIAL_MATRIX, &E)); 904b5966ddSBarry Smith PetscCall(MatDestroy(&E)); 91*5a2b941aSBarry Smith PetscCall(MatTranspose(A, MAT_INITIAL_MATRIX, &Bt)); 92*5a2b941aSBarry Smith PetscCall(MatAXPY(Bt, 1.0, B, DIFFERENT_NONZERO_PATTERN)); 93*5a2b941aSBarry Smith PetscCall(MatSetOption(Bt, MAT_SYMMETRIC, PETSC_TRUE)); 94*5a2b941aSBarry Smith PetscCall(MatConvert(Bt, MATSBAIJ, MAT_INITIAL_MATRIX, &E)); 95*5a2b941aSBarry Smith PetscCall(MatDestroy(&E)); 96*5a2b941aSBarry Smith PetscCall(MatDestroy(&Bt)); 974b5966ddSBarry Smith 98c4762a1bSJed Brown /* Test MatIncreaseOverlap() */ 999566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nd, &is1)); 1009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nd, &is2)); 101c4762a1bSJed Brown 10282b5ce2aSStefano Zampini emptynd = PETSC_FALSE; 10382b5ce2aSStefano Zampini if (rank == 0 && test_nd0) emptynd = PETSC_TRUE; /* test case */ 104c4762a1bSJed Brown 105c4762a1bSJed Brown for (i = 0; i < nd; i++) { 1069566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rdm, &rval)); 107c4762a1bSJed Brown sz = (int)(PetscRealPart(rval) * m); 108c4762a1bSJed Brown for (j = 0; j < sz; j++) { 1099566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rdm, &rval)); 110c4762a1bSJed Brown idx[j * bs] = bs * (int)(PetscRealPart(rval) * Mbs); 111c4762a1bSJed Brown for (k = 1; k < bs; k++) idx[j * bs + k] = idx[j * bs] + k; 112c4762a1bSJed Brown } 11382b5ce2aSStefano Zampini PetscCall(ISCreateGeneral(PETSC_COMM_SELF, emptynd ? 0 : sz * bs, idx, PETSC_COPY_VALUES, is1 + i)); 11482b5ce2aSStefano Zampini PetscCall(ISCreateGeneral(PETSC_COMM_SELF, emptynd ? 0 : sz * bs, idx, PETSC_COPY_VALUES, is2 + i)); 115c4762a1bSJed Brown } 1169566063dSJacob Faibussowitsch PetscCall(MatIncreaseOverlap(A, nd, is1, ov)); 1179566063dSJacob Faibussowitsch PetscCall(MatIncreaseOverlap(B, nd, is2, ov)); 118c4762a1bSJed Brown 119c4762a1bSJed Brown for (i = 0; i < nd; ++i) { 1209566063dSJacob Faibussowitsch PetscCall(ISEqual(is1[i], is2[i], &flg)); 121c4762a1bSJed Brown 12248a46eb9SPierre Jolivet if (!flg) PetscCall(PetscPrintf(PETSC_COMM_SELF, "i=%" PetscInt_FMT ", flg=%d :bs=%" PetscInt_FMT " m=%" PetscInt_FMT " ov=%" PetscInt_FMT " nd=%" PetscInt_FMT " np=%d\n", i, flg, bs, m, ov, nd, size)); 123c4762a1bSJed Brown } 124c4762a1bSJed Brown 125c4762a1bSJed Brown for (i = 0; i < nd; ++i) { 1269566063dSJacob Faibussowitsch PetscCall(ISSort(is1[i])); 1279566063dSJacob Faibussowitsch PetscCall(ISSort(is2[i])); 128c4762a1bSJed Brown } 129c4762a1bSJed Brown 1309566063dSJacob Faibussowitsch PetscCall(MatCreateSubMatrices(B, nd, is2, is2, MAT_INITIAL_MATRIX, &submatB)); 1319566063dSJacob Faibussowitsch PetscCall(MatCreateSubMatrices(A, nd, is1, is1, MAT_INITIAL_MATRIX, &submatA)); 132c4762a1bSJed Brown 133c4762a1bSJed Brown /* Test MatMult() */ 134c4762a1bSJed Brown for (i = 0; i < nd; i++) { 1359566063dSJacob Faibussowitsch PetscCall(MatGetSize(submatA[i], &mm, &nn)); 1369566063dSJacob Faibussowitsch PetscCall(VecCreateSeq(PETSC_COMM_SELF, mm, &xx)); 1379566063dSJacob Faibussowitsch PetscCall(VecDuplicate(xx, &s1)); 1389566063dSJacob Faibussowitsch PetscCall(VecDuplicate(xx, &s2)); 139c4762a1bSJed Brown for (j = 0; j < 3; j++) { 1409566063dSJacob Faibussowitsch PetscCall(VecSetRandom(xx, rdm)); 1419566063dSJacob Faibussowitsch PetscCall(MatMult(submatA[i], xx, s1)); 1429566063dSJacob Faibussowitsch PetscCall(MatMult(submatB[i], xx, s2)); 1439566063dSJacob Faibussowitsch PetscCall(VecNorm(s1, NORM_2, &s1norm)); 1449566063dSJacob Faibussowitsch PetscCall(VecNorm(s2, NORM_2, &s2norm)); 145c4762a1bSJed Brown rnorm = s2norm - s1norm; 14648a46eb9SPierre Jolivet if (rnorm < -tol || rnorm > tol) PetscCall(PetscPrintf(PETSC_COMM_SELF, "[%d]Error:MatMult - Norm1=%16.14e Norm2=%16.14e\n", rank, (double)s1norm, (double)s2norm)); 147c4762a1bSJed Brown } 1489566063dSJacob Faibussowitsch PetscCall(VecDestroy(&xx)); 1499566063dSJacob Faibussowitsch PetscCall(VecDestroy(&s1)); 1509566063dSJacob Faibussowitsch PetscCall(VecDestroy(&s2)); 151c4762a1bSJed Brown } 152c4762a1bSJed Brown 153c4762a1bSJed Brown /* Now test MatCreateSubmatrices with MAT_REUSE_MATRIX option */ 1549566063dSJacob Faibussowitsch PetscCall(MatCreateSubMatrices(A, nd, is1, is1, MAT_REUSE_MATRIX, &submatA)); 1559566063dSJacob Faibussowitsch PetscCall(MatCreateSubMatrices(B, nd, is2, is2, MAT_REUSE_MATRIX, &submatB)); 156c4762a1bSJed Brown 157c4762a1bSJed Brown /* Test MatMult() */ 158c4762a1bSJed Brown for (i = 0; i < nd; i++) { 1599566063dSJacob Faibussowitsch PetscCall(MatGetSize(submatA[i], &mm, &nn)); 1609566063dSJacob Faibussowitsch PetscCall(VecCreateSeq(PETSC_COMM_SELF, mm, &xx)); 1619566063dSJacob Faibussowitsch PetscCall(VecDuplicate(xx, &s1)); 1629566063dSJacob Faibussowitsch PetscCall(VecDuplicate(xx, &s2)); 163c4762a1bSJed Brown for (j = 0; j < 3; j++) { 1649566063dSJacob Faibussowitsch PetscCall(VecSetRandom(xx, rdm)); 1659566063dSJacob Faibussowitsch PetscCall(MatMult(submatA[i], xx, s1)); 1669566063dSJacob Faibussowitsch PetscCall(MatMult(submatB[i], xx, s2)); 1679566063dSJacob Faibussowitsch PetscCall(VecNorm(s1, NORM_2, &s1norm)); 1689566063dSJacob Faibussowitsch PetscCall(VecNorm(s2, NORM_2, &s2norm)); 169c4762a1bSJed Brown rnorm = s2norm - s1norm; 17048a46eb9SPierre Jolivet if (rnorm < -tol || rnorm > tol) PetscCall(PetscPrintf(PETSC_COMM_SELF, "[%d]Error:MatMult - Norm1=%16.14e Norm2=%16.14e\n", rank, (double)s1norm, (double)s2norm)); 171c4762a1bSJed Brown } 1729566063dSJacob Faibussowitsch PetscCall(VecDestroy(&xx)); 1739566063dSJacob Faibussowitsch PetscCall(VecDestroy(&s1)); 1749566063dSJacob Faibussowitsch PetscCall(VecDestroy(&s2)); 175c4762a1bSJed Brown } 176c4762a1bSJed Brown 177c4762a1bSJed Brown /* Free allocated memory */ 178c4762a1bSJed Brown for (i = 0; i < nd; ++i) { 1799566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is1[i])); 1809566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is2[i])); 181c4762a1bSJed Brown } 1829566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices(nd, &submatA)); 1839566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices(nd, &submatB)); 184c4762a1bSJed Brown 1859566063dSJacob Faibussowitsch PetscCall(PetscFree(is1)); 1869566063dSJacob Faibussowitsch PetscCall(PetscFree(is2)); 1879566063dSJacob Faibussowitsch PetscCall(PetscFree(idx)); 1889566063dSJacob Faibussowitsch PetscCall(PetscFree(rows)); 1899566063dSJacob Faibussowitsch PetscCall(PetscFree(cols)); 1909566063dSJacob Faibussowitsch PetscCall(PetscFree(vals)); 1919566063dSJacob Faibussowitsch PetscCall(MatDestroy(&A)); 1929566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 1939566063dSJacob Faibussowitsch PetscCall(PetscRandomDestroy(&rdm)); 1949566063dSJacob Faibussowitsch PetscCall(PetscFinalize()); 195b122ec5aSJacob Faibussowitsch return 0; 196c4762a1bSJed Brown } 197c4762a1bSJed Brown 198c4762a1bSJed Brown /*TEST 199c4762a1bSJed Brown 200c4762a1bSJed Brown test: 201c4762a1bSJed Brown nsize: {{1 3}} 20282b5ce2aSStefano Zampini args: -mat_block_size {{1 3 4 6 8}} -ov {{1 3}} -mat_size {{11 13}} -nd 7 203c4762a1bSJed Brown output_file: output/ex54.out 204c4762a1bSJed Brown 205c4762a1bSJed Brown test: 206c4762a1bSJed Brown suffix: 2 207c4762a1bSJed Brown args: -nd 2 -test_nd0 208c4762a1bSJed Brown output_file: output/ex54.out 209c4762a1bSJed Brown 210c4762a1bSJed Brown test: 211c4762a1bSJed Brown suffix: 3 212c4762a1bSJed Brown nsize: 3 213c4762a1bSJed Brown args: -nd 2 -test_nd0 214c4762a1bSJed Brown output_file: output/ex54.out 215c4762a1bSJed Brown 216c4762a1bSJed Brown TEST*/ 217