xref: /petsc/src/mat/tests/ex132.c (revision 9566063d113dddea24716c546802770db7481bc0)
1c4762a1bSJed Brown 
/* Help text for this test program; main() hands it to PetscInitialize(). */
2039c6fbaSStefano Zampini static char help[] = "Test MatAXPY()\n\n";
3c4762a1bSJed Brown 
4c4762a1bSJed Brown #include <petscmat.h>
5c4762a1bSJed Brown 
6c4762a1bSJed Brown int main(int argc,char **args)
7c4762a1bSJed Brown {
8b84f494bSStefano Zampini   Mat            C,C1,C2,CU;
9c4762a1bSJed Brown   PetscScalar    v;
10c4762a1bSJed Brown   PetscInt       Ii,J,Istart,Iend;
11039c6fbaSStefano Zampini   PetscInt       i,j,m = 3,n;
12039c6fbaSStefano Zampini   PetscMPIInt    size;
13b84f494bSStefano Zampini   PetscBool      mat_nonsymmetric = PETSC_FALSE,flg;
14c4762a1bSJed Brown   MatInfo        info;
15c4762a1bSJed Brown 
16*9566063dSJacob Faibussowitsch   PetscCall(PetscInitialize(&argc,&args,(char*)0,help));
17*9566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetInt(NULL,NULL,"-m",&m,NULL));
18*9566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PETSC_COMM_WORLD,&size));
19c4762a1bSJed Brown   n    = 2*size;
20c4762a1bSJed Brown 
21c4762a1bSJed Brown   /* Set flag if we are doing a nonsymmetric problem; the default is symmetric. */
22*9566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetBool(NULL,NULL,"-mat_nonsym",&mat_nonsymmetric,NULL));
23c4762a1bSJed Brown 
24*9566063dSJacob Faibussowitsch   PetscCall(MatCreate(PETSC_COMM_WORLD,&C));
25*9566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C,PETSC_DECIDE,PETSC_DECIDE,m*n,m*n));
26*9566063dSJacob Faibussowitsch   PetscCall(MatSetFromOptions(C));
27*9566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(C,5,NULL));
28*9566063dSJacob Faibussowitsch   PetscCall(MatMPIAIJSetPreallocation(C,5,NULL,5,NULL));
29c4762a1bSJed Brown 
30*9566063dSJacob Faibussowitsch   PetscCall(MatGetOwnershipRange(C,&Istart,&Iend));
31c4762a1bSJed Brown   for (Ii=Istart; Ii<Iend; Ii++) {
32c4762a1bSJed Brown     v = -1.0; i = Ii/n; j = Ii - i*n;
33*9566063dSJacob Faibussowitsch     if (i>0)   {J = Ii - n; PetscCall(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));}
34*9566063dSJacob Faibussowitsch     if (i<m-1) {J = Ii + n; PetscCall(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));}
35*9566063dSJacob Faibussowitsch     if (j>0)   {J = Ii - 1; PetscCall(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));}
36*9566063dSJacob Faibussowitsch     if (j<n-1) {J = Ii + 1; PetscCall(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));}
37*9566063dSJacob Faibussowitsch     v = 4.0; PetscCall(MatSetValues(C,1,&Ii,1,&Ii,&v,ADD_VALUES));
38c4762a1bSJed Brown   }
39c4762a1bSJed Brown 
40c4762a1bSJed Brown   /* Make the matrix nonsymmetric if desired */
41c4762a1bSJed Brown   if (mat_nonsymmetric) {
42c4762a1bSJed Brown     for (Ii=Istart; Ii<Iend; Ii++) {
43c4762a1bSJed Brown       v = -1.5; i = Ii/n;
44*9566063dSJacob Faibussowitsch       if (i>1) {J = Ii-n-1; PetscCall(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));}
45c4762a1bSJed Brown     }
46c4762a1bSJed Brown   } else {
47*9566063dSJacob Faibussowitsch     PetscCall(MatSetOption(C,MAT_SYMMETRIC,PETSC_TRUE));
48*9566063dSJacob Faibussowitsch     PetscCall(MatSetOption(C,MAT_SYMMETRY_ETERNAL,PETSC_TRUE));
49c4762a1bSJed Brown   }
50*9566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY));
51*9566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY));
52*9566063dSJacob Faibussowitsch   PetscCall(PetscObjectSetName((PetscObject)C,"C"));
53*9566063dSJacob Faibussowitsch   PetscCall(MatViewFromOptions(C,NULL,"-view"));
54c4762a1bSJed Brown 
55b84f494bSStefano Zampini   /* C1 = 2.0*C1 + C, C1 is anti-diagonal and has different non-zeros than C */
56*9566063dSJacob Faibussowitsch   PetscCall(MatCreate(PETSC_COMM_WORLD,&C1));
57*9566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C1,PETSC_DECIDE,PETSC_DECIDE,m*n,m*n));
58*9566063dSJacob Faibussowitsch   PetscCall(MatSetFromOptions(C1));
59*9566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(C1,1,NULL));
60*9566063dSJacob Faibussowitsch   PetscCall(MatMPIAIJSetPreallocation(C1,1,NULL,1,NULL));
61c4762a1bSJed Brown   for (Ii=Istart; Ii<Iend; Ii++) {
62039c6fbaSStefano Zampini     v = 1.0;
63039c6fbaSStefano Zampini     i = m*n - Ii -1;
64039c6fbaSStefano Zampini     j = Ii;
65*9566063dSJacob Faibussowitsch     PetscCall(MatSetValues(C1,1,&i,1,&j,&v,ADD_VALUES));
66c4762a1bSJed Brown   }
67*9566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C1,MAT_FINAL_ASSEMBLY));
68*9566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C1,MAT_FINAL_ASSEMBLY));
69*9566063dSJacob Faibussowitsch   PetscCall(PetscObjectSetName((PetscObject)C1,"C1"));
70*9566063dSJacob Faibussowitsch   PetscCall(MatViewFromOptions(C1,NULL,"-view"));
71*9566063dSJacob Faibussowitsch   PetscCall(MatDuplicate(C1,MAT_COPY_VALUES,&CU));
72b84f494bSStefano Zampini 
73*9566063dSJacob Faibussowitsch   PetscCall(PetscPrintf(PETSC_COMM_WORLD," MatAXPY(C1,2.0,C,DIFFERENT_NONZERO_PATTERN)...\n"));
74*9566063dSJacob Faibussowitsch   PetscCall(MatAXPY(C1,2.0,C,DIFFERENT_NONZERO_PATTERN));
75*9566063dSJacob Faibussowitsch   PetscCall(MatAXPY(CU,2.0,C,UNKNOWN_NONZERO_PATTERN));
76*9566063dSJacob Faibussowitsch   PetscCall(MatGetInfo(C1,MAT_GLOBAL_SUM,&info));
77*9566063dSJacob Faibussowitsch   PetscCall(PetscPrintf(PETSC_COMM_WORLD," C1: nz_allocated = %g; nz_used = %g; nz_unneeded = %g\n",info.nz_allocated,info.nz_used, info.nz_unneeded));
78*9566063dSJacob Faibussowitsch   PetscCall(MatViewFromOptions(C1,NULL,"-view"));
79*9566063dSJacob Faibussowitsch   PetscCall(MatMultEqual(CU,C1,10,&flg));
80b84f494bSStefano Zampini   if (!flg) {
81*9566063dSJacob Faibussowitsch     PetscCall(PetscPrintf(PETSC_COMM_WORLD,"Error UNKNOWN_NONZERO_PATTERN (supposedly DIFFERENT_NONZERO_PATTERN)\n"));
82*9566063dSJacob Faibussowitsch     PetscCall(MatViewFromOptions(CU,NULL,"-view"));
83b84f494bSStefano Zampini   }
84*9566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&CU));
85c4762a1bSJed Brown 
86b84f494bSStefano Zampini   /* Secondly, compute C1 = 2.0*C2 + C1, C2 has non-zero pattern of C */
87*9566063dSJacob Faibussowitsch   PetscCall(MatDuplicate(C,MAT_DO_NOT_COPY_VALUES,&C2));
88*9566063dSJacob Faibussowitsch   PetscCall(MatDuplicate(C1,MAT_COPY_VALUES,&CU));
89c4762a1bSJed Brown 
90c4762a1bSJed Brown   for (Ii=Istart; Ii<Iend; Ii++) {
91c4762a1bSJed Brown     v    = 1.0;
92*9566063dSJacob Faibussowitsch     PetscCall(MatSetValues(C2,1,&Ii,1,&Ii,&v,ADD_VALUES));
93c4762a1bSJed Brown   }
94*9566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C2,MAT_FINAL_ASSEMBLY));
95*9566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C2,MAT_FINAL_ASSEMBLY));
96*9566063dSJacob Faibussowitsch   PetscCall(PetscObjectSetName((PetscObject)C2,"C2"));
97*9566063dSJacob Faibussowitsch   PetscCall(MatViewFromOptions(C2,NULL,"-view"));
98*9566063dSJacob Faibussowitsch   PetscCall(PetscPrintf(PETSC_COMM_WORLD," MatAXPY(C1,2.0,C2,SUBSET_NONZERO_PATTERN)...\n"));
99*9566063dSJacob Faibussowitsch   PetscCall(MatAXPY(C1,2.0,C2,SUBSET_NONZERO_PATTERN));
100*9566063dSJacob Faibussowitsch   PetscCall(MatAXPY(CU,2.0,C2,UNKNOWN_NONZERO_PATTERN));
101*9566063dSJacob Faibussowitsch   PetscCall(MatGetInfo(C1,MAT_GLOBAL_SUM,&info));
102*9566063dSJacob Faibussowitsch   PetscCall(PetscPrintf(PETSC_COMM_WORLD," C1: nz_allocated = %g; nz_used = %g; nz_unneeded = %g\n",info.nz_allocated,info.nz_used, info.nz_unneeded));
103*9566063dSJacob Faibussowitsch   PetscCall(MatViewFromOptions(C1,NULL,"-view"));
104*9566063dSJacob Faibussowitsch   PetscCall(MatMultEqual(CU,C1,10,&flg));
105b84f494bSStefano Zampini   if (!flg) {
106*9566063dSJacob Faibussowitsch     PetscCall(PetscPrintf(PETSC_COMM_WORLD,"Error UNKNOWN_NONZERO_PATTERN (supposedly SUBSET_NONZERO_PATTERN)\n"));
107*9566063dSJacob Faibussowitsch     PetscCall(MatViewFromOptions(CU,NULL,"-view"));
108b84f494bSStefano Zampini   }
109*9566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&CU));
110039c6fbaSStefano Zampini 
111b84f494bSStefano Zampini   /* Test SAME_NONZERO_PATTERN computing C2 = C2 + 2.0 * C */
112*9566063dSJacob Faibussowitsch   PetscCall(MatDuplicate(C2,MAT_COPY_VALUES,&CU));
113*9566063dSJacob Faibussowitsch   PetscCall(PetscPrintf(PETSC_COMM_WORLD," MatAXPY(C2,2.0,C,SAME_NONZERO_PATTERN)...\n"));
114*9566063dSJacob Faibussowitsch   PetscCall(MatAXPY(C2,2.0,C,SAME_NONZERO_PATTERN));
115*9566063dSJacob Faibussowitsch   PetscCall(MatAXPY(CU,2.0,C,UNKNOWN_NONZERO_PATTERN));
116*9566063dSJacob Faibussowitsch   PetscCall(MatGetInfo(C2,MAT_GLOBAL_SUM,&info));
117*9566063dSJacob Faibussowitsch   PetscCall(PetscPrintf(PETSC_COMM_WORLD," C2: nz_allocated = %g; nz_used = %g; nz_unneeded = %g\n",info.nz_allocated,info.nz_used, info.nz_unneeded));
118*9566063dSJacob Faibussowitsch   PetscCall(MatViewFromOptions(C2,NULL,"-view"));
119*9566063dSJacob Faibussowitsch   PetscCall(MatMultEqual(CU,C2,10,&flg));
120b84f494bSStefano Zampini   if (!flg) {
121*9566063dSJacob Faibussowitsch     PetscCall(PetscPrintf(PETSC_COMM_WORLD,"Error UNKNOWN_NONZERO_PATTERN (supposedly SUBSET_NONZERO_PATTERN)\n"));
122*9566063dSJacob Faibussowitsch     PetscCall(MatViewFromOptions(CU,NULL,"-view"));
123b84f494bSStefano Zampini   }
124*9566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&CU));
125c4762a1bSJed Brown 
126*9566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&C1));
127*9566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&C2));
128*9566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&C));
129c4762a1bSJed Brown 
130*9566063dSJacob Faibussowitsch   PetscCall(PetscFinalize());
131b122ec5aSJacob Faibussowitsch   return 0;
132c4762a1bSJed Brown }
133c4762a1bSJed Brown 
134c4762a1bSJed Brown /*TEST
135c4762a1bSJed Brown 
136c4762a1bSJed Brown    test:
137039c6fbaSStefano Zampini      suffix: 1
138039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
139039c6fbaSStefano Zampini      args: -view
140039c6fbaSStefano Zampini      diff_args: -j
141039c6fbaSStefano Zampini 
142039c6fbaSStefano Zampini    test:
143039c6fbaSStefano Zampini      output_file: output/ex132_1.out
144039c6fbaSStefano Zampini      requires: cuda
145039c6fbaSStefano Zampini      suffix: 1_cuda
146039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
147039c6fbaSStefano Zampini      args: -view -mat_type aijcusparse
148039c6fbaSStefano Zampini      diff_args: -j
149039c6fbaSStefano Zampini 
150039c6fbaSStefano Zampini    test:
151039c6fbaSStefano Zampini      output_file: output/ex132_1.out
152039c6fbaSStefano Zampini      requires: kokkos_kernels
153039c6fbaSStefano Zampini      suffix: 1_kokkos
154039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
155039c6fbaSStefano Zampini      args: -view -mat_type aijkokkos
156039c6fbaSStefano Zampini      diff_args: -j
157039c6fbaSStefano Zampini 
158039c6fbaSStefano Zampini    test:
159039c6fbaSStefano Zampini      suffix: 2
160039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
161039c6fbaSStefano Zampini      args: -view -mat_nonsym
162039c6fbaSStefano Zampini      diff_args: -j
163039c6fbaSStefano Zampini 
164039c6fbaSStefano Zampini    test:
165039c6fbaSStefano Zampini      output_file: output/ex132_2.out
166039c6fbaSStefano Zampini      requires: cuda
167039c6fbaSStefano Zampini      suffix: 2_cuda
168039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
169039c6fbaSStefano Zampini      args: -view -mat_type aijcusparse -mat_nonsym
170039c6fbaSStefano Zampini      diff_args: -j
171039c6fbaSStefano Zampini 
172039c6fbaSStefano Zampini    test:
173039c6fbaSStefano Zampini      output_file: output/ex132_2.out
174039c6fbaSStefano Zampini      requires: kokkos_kernels
175039c6fbaSStefano Zampini      suffix: 2_kokkos
176039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
177039c6fbaSStefano Zampini      args: -view -mat_type aijkokkos -mat_nonsym
178039c6fbaSStefano Zampini      diff_args: -j
179039c6fbaSStefano Zampini 
180039c6fbaSStefano Zampini    test:
181039c6fbaSStefano Zampini      nsize: 2
182039c6fbaSStefano Zampini      suffix: 1_par
183039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
184039c6fbaSStefano Zampini      args: -view
185039c6fbaSStefano Zampini      diff_args: -j
186039c6fbaSStefano Zampini 
187039c6fbaSStefano Zampini    test:
188039c6fbaSStefano Zampini      nsize: 2
189039c6fbaSStefano Zampini      output_file: output/ex132_1_par.out
190039c6fbaSStefano Zampini      requires: cuda
191039c6fbaSStefano Zampini      suffix: 1_par_cuda
192039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
193039c6fbaSStefano Zampini      args: -view -mat_type aijcusparse
194039c6fbaSStefano Zampini      diff_args: -j
195039c6fbaSStefano Zampini 
196039c6fbaSStefano Zampini    test:
197039c6fbaSStefano Zampini      nsize: 2
198039c6fbaSStefano Zampini      output_file: output/ex132_1_par.out
1993078479eSJunchao Zhang      requires: !sycl kokkos_kernels
200039c6fbaSStefano Zampini      suffix: 1_par_kokkos
201039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
202039c6fbaSStefano Zampini      args: -view -mat_type aijkokkos
203039c6fbaSStefano Zampini      diff_args: -j
204039c6fbaSStefano Zampini 
205039c6fbaSStefano Zampini    test:
206039c6fbaSStefano Zampini      nsize: 2
207039c6fbaSStefano Zampini      suffix: 2_par
208039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
209039c6fbaSStefano Zampini      args: -view -mat_nonsym
210039c6fbaSStefano Zampini      diff_args: -j
211039c6fbaSStefano Zampini 
212039c6fbaSStefano Zampini    test:
213039c6fbaSStefano Zampini      nsize: 2
214039c6fbaSStefano Zampini      output_file: output/ex132_2_par.out
215039c6fbaSStefano Zampini      requires: cuda
216039c6fbaSStefano Zampini      suffix: 2_par_cuda
217039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
218039c6fbaSStefano Zampini      args: -view -mat_type aijcusparse -mat_nonsym
219039c6fbaSStefano Zampini      diff_args: -j
220039c6fbaSStefano Zampini 
221f3482364SScott Kruger    testset:
222039c6fbaSStefano Zampini      nsize: 2
223039c6fbaSStefano Zampini      output_file: output/ex132_2_par.out
2243078479eSJunchao Zhang      requires: !sycl kokkos_kernels
225039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
226f3482364SScott Kruger      args: -view -mat_type aijkokkos -mat_nonsym
227039c6fbaSStefano Zampini      diff_args: -j
228f3482364SScott Kruger      test:
229f3482364SScott Kruger        suffix: 2_par_kokkos_no_gpu_aware
230f3482364SScott Kruger        args: -use_gpu_aware_mpi 0
231f3482364SScott Kruger      test:
232f3482364SScott Kruger        requires: defined(HAVE_MPI_GPU_AWARE)
233f3482364SScott Kruger        suffix: 2_par_kokkos_gpu_aware
234f3482364SScott Kruger        args: -use_gpu_aware_mpi 1
235c4762a1bSJed Brown 
236c4762a1bSJed Brown TEST*/
237