xref: /petsc/src/mat/tests/ex18.c (revision 1baa6e3354bfe224b33a0c158f482508792a8a6e)
1c4762a1bSJed Brown static char help[] = "Tests the use of MatZeroRowsColumns() for parallel matrices.\n\
2c4762a1bSJed Brown Contributed-by: Stephan Kramer <s.kramer@imperial.ac.uk>\n\n";
3c4762a1bSJed Brown 
4c4762a1bSJed Brown #include <petscmat.h>
5c4762a1bSJed Brown 
6c4762a1bSJed Brown int main(int argc,char **args)
7c4762a1bSJed Brown {
8c4762a1bSJed Brown   Mat            A;
9c4762a1bSJed Brown   Vec            x, rhs, y;
10c4762a1bSJed Brown   PetscInt       i,j,k,b,m = 3,n,nlocal=2,bs=1,Ii,J;
11c4762a1bSJed Brown   PetscInt       *boundary_nodes, nboundary_nodes, *boundary_indices;
12c4762a1bSJed Brown   PetscMPIInt    rank,size;
13c4762a1bSJed Brown   PetscScalar    v,v0,v1,v2,a0=0.1,a,rhsval, *boundary_values,diag = 1.0;
14c4762a1bSJed Brown   PetscReal      norm;
15c4762a1bSJed Brown   char           convname[64];
16c4762a1bSJed Brown   PetscBool      upwind = PETSC_FALSE, nonlocalBC = PETSC_FALSE, zerorhs = PETSC_TRUE, convert = PETSC_FALSE;
17c4762a1bSJed Brown 
189566063dSJacob Faibussowitsch   PetscCall(PetscInitialize(&argc,&args,(char*)0,help));
199566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_rank(PETSC_COMM_WORLD,&rank));
209566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PETSC_COMM_WORLD,&size));
21c4762a1bSJed Brown   n = nlocal*size;
22c4762a1bSJed Brown 
239566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetInt(NULL,NULL, "-bs", &bs, NULL));
249566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetBool(NULL,NULL, "-nonlocal_bc", &nonlocalBC, NULL));
259566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetScalar(NULL,NULL, "-diag", &diag, NULL));
269566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetString(NULL,NULL,"-convname",convname,sizeof(convname),&convert));
279566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetBool(NULL,NULL, "-zerorhs", &zerorhs, NULL));
28c4762a1bSJed Brown 
299566063dSJacob Faibussowitsch   PetscCall(MatCreate(PETSC_COMM_WORLD,&A));
309566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(A,PETSC_DECIDE,PETSC_DECIDE,m*n*bs,m*n*bs));
319566063dSJacob Faibussowitsch   PetscCall(MatSetFromOptions(A));
329566063dSJacob Faibussowitsch   PetscCall(MatSetUp(A));
33c4762a1bSJed Brown 
349566063dSJacob Faibussowitsch   PetscCall(MatCreateVecs(A, NULL, &rhs));
359566063dSJacob Faibussowitsch   PetscCall(VecSetFromOptions(rhs));
369566063dSJacob Faibussowitsch   PetscCall(VecSetUp(rhs));
37c4762a1bSJed Brown 
38c4762a1bSJed Brown   rhsval = 0.0;
39c4762a1bSJed Brown   for (i=0; i<m; i++) {
40c4762a1bSJed Brown     for (j=nlocal*rank; j<nlocal*(rank+1); j++) {
41c4762a1bSJed Brown       a = a0;
42c4762a1bSJed Brown       for (b=0; b<bs; b++) {
43c4762a1bSJed Brown         /* let's start with a 5-point stencil diffusion term */
44c4762a1bSJed Brown         v = -1.0;  Ii = (j + n*i)*bs + b;
459566063dSJacob Faibussowitsch         if (i>0)   {J = Ii - n*bs; PetscCall(MatSetValues(A,1,&Ii,1,&J,&v,ADD_VALUES));}
469566063dSJacob Faibussowitsch         if (i<m-1) {J = Ii + n*bs; PetscCall(MatSetValues(A,1,&Ii,1,&J,&v,ADD_VALUES));}
479566063dSJacob Faibussowitsch         if (j>0)   {J = Ii - 1*bs; PetscCall(MatSetValues(A,1,&Ii,1,&J,&v,ADD_VALUES));}
489566063dSJacob Faibussowitsch         if (j<n-1) {J = Ii + 1*bs; PetscCall(MatSetValues(A,1,&Ii,1,&J,&v,ADD_VALUES));}
499566063dSJacob Faibussowitsch         v = 4.0; PetscCall(MatSetValues(A,1,&Ii,1,&Ii,&v,ADD_VALUES));
50c4762a1bSJed Brown         if (upwind) {
51c4762a1bSJed Brown           /* now add a 2nd order upwind advection term to add a little asymmetry */
52c4762a1bSJed Brown           if (j>2) {
53c4762a1bSJed Brown             J = Ii-2*bs; v2 = 0.5*a; v1 = -2.0*a; v0 = 1.5*a;
549566063dSJacob Faibussowitsch             PetscCall(MatSetValues(A,1,&Ii,1,&J,&v2,ADD_VALUES));
55c4762a1bSJed Brown           } else {
56c4762a1bSJed Brown             /* fall back to 1st order upwind */
57c4762a1bSJed Brown             v1 = -1.0*a; v0 = 1.0*a;
58c4762a1bSJed Brown           };
599566063dSJacob Faibussowitsch           if (j>1) {J = Ii-1*bs; PetscCall(MatSetValues(A,1,&Ii,1,&J,&v1,ADD_VALUES));}
609566063dSJacob Faibussowitsch           PetscCall(MatSetValues(A,1,&Ii,1,&Ii,&v0,ADD_VALUES));
61c4762a1bSJed Brown           a /= 10.; /* use a different velocity for the next component */
62c4762a1bSJed Brown           /* add a coupling to the previous and next components */
63c4762a1bSJed Brown           v = 0.5;
649566063dSJacob Faibussowitsch           if (b>0) {J = Ii - 1; PetscCall(MatSetValues(A,1,&Ii,1,&J,&v,ADD_VALUES));}
659566063dSJacob Faibussowitsch           if (b<bs-1) {J = Ii + 1; PetscCall(MatSetValues(A,1,&Ii,1,&J,&v,ADD_VALUES));}
66c4762a1bSJed Brown         }
67c4762a1bSJed Brown         /* make up some rhs */
689566063dSJacob Faibussowitsch         PetscCall(VecSetValue(rhs, Ii, rhsval, INSERT_VALUES));
69c4762a1bSJed Brown         rhsval += 1.0;
70c4762a1bSJed Brown       }
71c4762a1bSJed Brown     }
72c4762a1bSJed Brown   }
739566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY));
749566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY));
75c4762a1bSJed Brown 
76c4762a1bSJed Brown   if (convert) { /* Test different Mat implementations */
77c4762a1bSJed Brown     Mat B;
78c4762a1bSJed Brown 
799566063dSJacob Faibussowitsch     PetscCall(MatConvert(A,convname,MAT_INITIAL_MATRIX,&B));
809566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&A));
81c4762a1bSJed Brown     A    = B;
82c4762a1bSJed Brown   }
83c4762a1bSJed Brown 
849566063dSJacob Faibussowitsch   PetscCall(VecAssemblyBegin(rhs));
859566063dSJacob Faibussowitsch   PetscCall(VecAssemblyEnd(rhs));
86c4762a1bSJed Brown   /* set rhs to zero to simplify */
87*1baa6e33SBarry Smith   if (zerorhs) PetscCall(VecZeroEntries(rhs));
88c4762a1bSJed Brown 
89c4762a1bSJed Brown   if (nonlocalBC) {
90c4762a1bSJed Brown     /*version where boundary conditions are set by processes that don't necessarily own the nodes */
91dd400576SPatrick Sanan     if (rank == 0) {
92c4762a1bSJed Brown       nboundary_nodes = size>m ? nlocal : m-size+nlocal;
939566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nboundary_nodes,&boundary_nodes));
94c4762a1bSJed Brown       k = 0;
95c4762a1bSJed Brown       for (i=size; i<m; i++,k++) {boundary_nodes[k] = n*i;};
96c4762a1bSJed Brown     } else if (rank < m) {
97c4762a1bSJed Brown       nboundary_nodes = nlocal+1;
989566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nboundary_nodes,&boundary_nodes));
99c4762a1bSJed Brown       boundary_nodes[0] = rank*n;
100c4762a1bSJed Brown       k = 1;
101c4762a1bSJed Brown     } else {
102c4762a1bSJed Brown       nboundary_nodes = nlocal;
1039566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nboundary_nodes,&boundary_nodes));
104c4762a1bSJed Brown       k = 0;
105c4762a1bSJed Brown     }
106c4762a1bSJed Brown     for (j=nlocal*rank; j<nlocal*(rank+1); j++,k++) {boundary_nodes[k] = j;};
107c4762a1bSJed Brown   } else {
108c4762a1bSJed Brown     /*version where boundary conditions are set by the node owners only */
1099566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m*n,&boundary_nodes));
110c4762a1bSJed Brown     k=0;
111c4762a1bSJed Brown     for (j=0; j<n; j++) {
112c4762a1bSJed Brown       Ii = j;
113c4762a1bSJed Brown       if (Ii>=rank*m*nlocal && Ii<(rank+1)*m*nlocal) boundary_nodes[k++] = Ii;
114c4762a1bSJed Brown     }
115c4762a1bSJed Brown     for (i=1; i<m; i++) {
116c4762a1bSJed Brown       Ii = n*i;
117c4762a1bSJed Brown       if (Ii>=rank*m*nlocal && Ii<(rank+1)*m*nlocal) boundary_nodes[k++] = Ii;
118c4762a1bSJed Brown     }
119c4762a1bSJed Brown     nboundary_nodes = k;
120c4762a1bSJed Brown   }
121c4762a1bSJed Brown 
1229566063dSJacob Faibussowitsch   PetscCall(VecDuplicate(rhs, &x));
1239566063dSJacob Faibussowitsch   PetscCall(VecZeroEntries(x));
1249566063dSJacob Faibussowitsch   PetscCall(PetscMalloc2(nboundary_nodes*bs,&boundary_indices,nboundary_nodes*bs,&boundary_values));
125c4762a1bSJed Brown   for (k=0; k<nboundary_nodes; k++) {
126c4762a1bSJed Brown     Ii = boundary_nodes[k]*bs;
127c4762a1bSJed Brown     v = 1.0*boundary_nodes[k];
128c4762a1bSJed Brown     for (b=0; b<bs; b++, Ii++) {
129c4762a1bSJed Brown       boundary_indices[k*bs+b] = Ii;
130c4762a1bSJed Brown       boundary_values[k*bs+b] = v;
1319566063dSJacob Faibussowitsch       PetscCall(PetscSynchronizedPrintf(PETSC_COMM_WORLD, "%d %" PetscInt_FMT " %f\n", rank, Ii, (double)PetscRealPart(v)));
132c4762a1bSJed Brown       v += 0.1;
133c4762a1bSJed Brown     }
134c4762a1bSJed Brown   }
1359566063dSJacob Faibussowitsch   PetscCall(PetscSynchronizedFlush(PETSC_COMM_WORLD, NULL));
1369566063dSJacob Faibussowitsch   PetscCall(VecSetValues(x, nboundary_nodes*bs, boundary_indices, boundary_values, INSERT_VALUES));
1379566063dSJacob Faibussowitsch   PetscCall(VecAssemblyBegin(x));
1389566063dSJacob Faibussowitsch   PetscCall(VecAssemblyEnd(x));
139c4762a1bSJed Brown 
140c4762a1bSJed Brown   /* We can check the rhs returned by MatZeroColumns by computing y=rhs-A*x  and overwriting the boundary entries with boundary values */
1419566063dSJacob Faibussowitsch   PetscCall(VecDuplicate(x, &y));
1429566063dSJacob Faibussowitsch   PetscCall(MatMult(A, x, y));
1439566063dSJacob Faibussowitsch   PetscCall(VecAYPX(y, -1.0, rhs));
144c4762a1bSJed Brown   for (k=0; k<nboundary_nodes*bs; k++) boundary_values[k] *= diag;
1459566063dSJacob Faibussowitsch   PetscCall(VecSetValues(y, nboundary_nodes*bs, boundary_indices, boundary_values, INSERT_VALUES));
1469566063dSJacob Faibussowitsch   PetscCall(VecAssemblyBegin(y));
1479566063dSJacob Faibussowitsch   PetscCall(VecAssemblyEnd(y));
148c4762a1bSJed Brown 
1499566063dSJacob Faibussowitsch   PetscCall(PetscPrintf(PETSC_COMM_WORLD, "*** Matrix A and vector x:\n"));
1509566063dSJacob Faibussowitsch   PetscCall(MatView(A, PETSC_VIEWER_STDOUT_WORLD));
1519566063dSJacob Faibussowitsch   PetscCall(VecView(x,PETSC_VIEWER_STDOUT_WORLD));
152c4762a1bSJed Brown 
1539566063dSJacob Faibussowitsch   PetscCall(MatZeroRowsColumns(A, nboundary_nodes*bs, boundary_indices, diag, x, rhs));
1549566063dSJacob Faibussowitsch   PetscCall(PetscPrintf(PETSC_COMM_WORLD, "*** Vector rhs returned by MatZeroRowsColumns\n"));
1559566063dSJacob Faibussowitsch   PetscCall(VecView(rhs,PETSC_VIEWER_STDOUT_WORLD));
1569566063dSJacob Faibussowitsch   PetscCall(VecAXPY(y, -1.0, rhs));
1579566063dSJacob Faibussowitsch   PetscCall(VecNorm(y, NORM_INFINITY, &norm));
158c4762a1bSJed Brown   if (norm > 1.0e-10) {
1599566063dSJacob Faibussowitsch     PetscCall(PetscPrintf(PETSC_COMM_WORLD, "*** Difference between rhs and y, inf-norm: %f\n", (double)norm));
1609566063dSJacob Faibussowitsch     PetscCall(VecView(y,PETSC_VIEWER_STDOUT_WORLD));
161c4762a1bSJed Brown     SETERRQ(PETSC_COMM_WORLD, PETSC_ERR_PLIB, "Bug in MatZeroRowsColumns");
162c4762a1bSJed Brown   }
163c4762a1bSJed Brown 
1649566063dSJacob Faibussowitsch   PetscCall(PetscFree(boundary_nodes));
1659566063dSJacob Faibussowitsch   PetscCall(PetscFree2(boundary_indices,boundary_values));
1669566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&x));
1679566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&y));
1689566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&rhs));
1699566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&A));
170c4762a1bSJed Brown 
1719566063dSJacob Faibussowitsch   PetscCall(PetscFinalize());
172b122ec5aSJacob Faibussowitsch   return 0;
173c4762a1bSJed Brown }
174c4762a1bSJed Brown 
175c4762a1bSJed Brown /*TEST
176c4762a1bSJed Brown 
177c4762a1bSJed Brown    test:
1789fd945daSStefano Zampini       diff_args: -j
179c4762a1bSJed Brown       suffix: 0
180c4762a1bSJed Brown 
181c4762a1bSJed Brown    test:
1829fd945daSStefano Zampini       diff_args: -j
183c4762a1bSJed Brown       suffix: 1
184c4762a1bSJed Brown       nsize: 2
185c4762a1bSJed Brown 
186c4762a1bSJed Brown    test:
1879fd945daSStefano Zampini       diff_args: -j
188c4762a1bSJed Brown       suffix: 10
189c4762a1bSJed Brown       nsize: 2
190c4762a1bSJed Brown       args: -bs 2 -nonlocal_bc
191c4762a1bSJed Brown 
192c4762a1bSJed Brown    test:
1939fd945daSStefano Zampini       diff_args: -j
194c4762a1bSJed Brown       suffix: 11
195c4762a1bSJed Brown       nsize: 7
196c4762a1bSJed Brown       args: -bs 2 -nonlocal_bc
197c4762a1bSJed Brown 
198c4762a1bSJed Brown    test:
1999fd945daSStefano Zampini       diff_args: -j
200c4762a1bSJed Brown       suffix: 12
201c4762a1bSJed Brown       args: -bs 2 -nonlocal_bc -mat_type baij
202c4762a1bSJed Brown 
203c4762a1bSJed Brown    test:
2049fd945daSStefano Zampini       diff_args: -j
205c4762a1bSJed Brown       suffix: 13
206c4762a1bSJed Brown       nsize: 2
207c4762a1bSJed Brown       args: -bs 2 -nonlocal_bc -mat_type baij
208c4762a1bSJed Brown 
209c4762a1bSJed Brown    test:
2109fd945daSStefano Zampini       diff_args: -j
211c4762a1bSJed Brown       suffix: 14
212c4762a1bSJed Brown       nsize: 7
213c4762a1bSJed Brown       args: -bs 2 -nonlocal_bc -mat_type baij
214c4762a1bSJed Brown 
215c4762a1bSJed Brown    test:
2169fd945daSStefano Zampini       diff_args: -j
217c4762a1bSJed Brown       suffix: 2
218c4762a1bSJed Brown       nsize: 7
219c4762a1bSJed Brown 
220c4762a1bSJed Brown    test:
2219fd945daSStefano Zampini       diff_args: -j
222c4762a1bSJed Brown       suffix: 3
223c4762a1bSJed Brown       args: -mat_type baij
224c4762a1bSJed Brown 
225c4762a1bSJed Brown    test:
2269fd945daSStefano Zampini       diff_args: -j
227c4762a1bSJed Brown       suffix: 4
228c4762a1bSJed Brown       nsize: 2
229c4762a1bSJed Brown       args: -mat_type baij
230c4762a1bSJed Brown 
231c4762a1bSJed Brown    test:
2329fd945daSStefano Zampini       diff_args: -j
233c4762a1bSJed Brown       suffix: 5
234c4762a1bSJed Brown       nsize: 7
235c4762a1bSJed Brown       args: -mat_type baij
236c4762a1bSJed Brown 
237c4762a1bSJed Brown    test:
2389fd945daSStefano Zampini       diff_args: -j
239c4762a1bSJed Brown       suffix: 6
240c4762a1bSJed Brown       args: -bs 2 -mat_type baij
241c4762a1bSJed Brown 
242c4762a1bSJed Brown    test:
2439fd945daSStefano Zampini       diff_args: -j
244c4762a1bSJed Brown       suffix: 7
245c4762a1bSJed Brown       nsize: 2
246c4762a1bSJed Brown       args: -bs 2 -mat_type baij
247c4762a1bSJed Brown 
248c4762a1bSJed Brown    test:
2499fd945daSStefano Zampini       diff_args: -j
250c4762a1bSJed Brown       suffix: 8
251c4762a1bSJed Brown       nsize: 7
252c4762a1bSJed Brown       args: -bs 2 -mat_type baij
253c4762a1bSJed Brown 
254c4762a1bSJed Brown    test:
2559fd945daSStefano Zampini       diff_args: -j
256c4762a1bSJed Brown       suffix: 9
257c4762a1bSJed Brown       args: -bs 2 -nonlocal_bc
258c4762a1bSJed Brown 
259c4762a1bSJed Brown    test:
2609fd945daSStefano Zampini       diff_args: -j
261c4762a1bSJed Brown       suffix: 15
262c4762a1bSJed Brown       args: -bs 2 -nonlocal_bc -convname shell
263c4762a1bSJed Brown 
264c4762a1bSJed Brown    test:
2659fd945daSStefano Zampini       diff_args: -j
266c4762a1bSJed Brown       suffix: 16
267c4762a1bSJed Brown       nsize: 2
268c4762a1bSJed Brown       args: -bs 2 -nonlocal_bc -convname shell
269c4762a1bSJed Brown 
270c4762a1bSJed Brown    test:
2719fd945daSStefano Zampini       diff_args: -j
272c4762a1bSJed Brown       suffix: 17
273c4762a1bSJed Brown       args: -bs 2 -nonlocal_bc -convname dense
274c4762a1bSJed Brown 
275c4762a1bSJed Brown    testset:
2769fd945daSStefano Zampini       diff_args: -j
277c4762a1bSJed Brown       suffix: full
278c4762a1bSJed Brown       nsize: {{1 3}separate output}
279c4762a1bSJed Brown       args: -diag {{0.12 -0.13}separate output} -convname {{aij shell baij}separate output} -zerorhs 0
28038a8e8c1SStefano Zampini 
28138a8e8c1SStefano Zampini    test:
2829fd945daSStefano Zampini       diff_args: -j
28338a8e8c1SStefano Zampini       requires: cuda
28438a8e8c1SStefano Zampini       suffix: cusparse_1
28538a8e8c1SStefano Zampini       nsize: 1
28638a8e8c1SStefano Zampini       args: -diag {{0.12 -0.13}separate output} -convname {{seqaijcusparse mpiaijcusparse}separate output} -zerorhs 0 -mat_type {{seqaijcusparse mpiaijcusparse}separate output}
28738a8e8c1SStefano Zampini 
28838a8e8c1SStefano Zampini    test:
2899fd945daSStefano Zampini       diff_args: -j
29038a8e8c1SStefano Zampini       requires: cuda
29138a8e8c1SStefano Zampini       suffix: cusparse_3
29238a8e8c1SStefano Zampini       nsize: 3
29338a8e8c1SStefano Zampini       args: -diag {{0.12 -0.13}separate output} -convname mpiaijcusparse -zerorhs 0 -mat_type mpiaijcusparse
29438a8e8c1SStefano Zampini 
295c4762a1bSJed Brown TEST*/
296