xref: /petsc/src/mat/tests/ex132.c (revision 5f80ce2ab25dff0f4601e710601cbbcecf323266)
1c4762a1bSJed Brown 
2039c6fbaSStefano Zampini static char help[] = "Test MatAXPY()\n\n";
3c4762a1bSJed Brown 
4c4762a1bSJed Brown #include <petscmat.h>
5c4762a1bSJed Brown 
6c4762a1bSJed Brown int main(int argc,char **args)
7c4762a1bSJed Brown {
8b84f494bSStefano Zampini   Mat            C,C1,C2,CU;
9c4762a1bSJed Brown   PetscScalar    v;
10c4762a1bSJed Brown   PetscInt       Ii,J,Istart,Iend;
11c4762a1bSJed Brown   PetscErrorCode ierr;
12039c6fbaSStefano Zampini   PetscInt       i,j,m = 3,n;
13039c6fbaSStefano Zampini   PetscMPIInt    size;
14b84f494bSStefano Zampini   PetscBool      mat_nonsymmetric = PETSC_FALSE,flg;
15c4762a1bSJed Brown   MatInfo        info;
16c4762a1bSJed Brown 
17c4762a1bSJed Brown   ierr = PetscInitialize(&argc,&args,(char*)0,help);if (ierr) return ierr;
18*5f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscOptionsGetInt(NULL,NULL,"-m",&m,NULL));
19*5f80ce2aSJacob Faibussowitsch   CHKERRMPI(MPI_Comm_size(PETSC_COMM_WORLD,&size));
20c4762a1bSJed Brown   n    = 2*size;
21c4762a1bSJed Brown 
22c4762a1bSJed Brown   /* Set flag if we are doing a nonsymmetric problem; the default is symmetric. */
23*5f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscOptionsGetBool(NULL,NULL,"-mat_nonsym",&mat_nonsymmetric,NULL));
24c4762a1bSJed Brown 
25*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatCreate(PETSC_COMM_WORLD,&C));
26*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSetSizes(C,PETSC_DECIDE,PETSC_DECIDE,m*n,m*n));
27*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSetFromOptions(C));
28*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSeqAIJSetPreallocation(C,5,NULL));
29*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatMPIAIJSetPreallocation(C,5,NULL,5,NULL));
30c4762a1bSJed Brown 
31*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetOwnershipRange(C,&Istart,&Iend));
32c4762a1bSJed Brown   for (Ii=Istart; Ii<Iend; Ii++) {
33c4762a1bSJed Brown     v = -1.0; i = Ii/n; j = Ii - i*n;
34*5f80ce2aSJacob Faibussowitsch     if (i>0)   {J = Ii - n; CHKERRQ(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));}
35*5f80ce2aSJacob Faibussowitsch     if (i<m-1) {J = Ii + n; CHKERRQ(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));}
36*5f80ce2aSJacob Faibussowitsch     if (j>0)   {J = Ii - 1; CHKERRQ(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));}
37*5f80ce2aSJacob Faibussowitsch     if (j<n-1) {J = Ii + 1; CHKERRQ(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));}
38*5f80ce2aSJacob Faibussowitsch     v = 4.0; CHKERRQ(MatSetValues(C,1,&Ii,1,&Ii,&v,ADD_VALUES));
39c4762a1bSJed Brown   }
40c4762a1bSJed Brown 
41c4762a1bSJed Brown   /* Make the matrix nonsymmetric if desired */
42c4762a1bSJed Brown   if (mat_nonsymmetric) {
43c4762a1bSJed Brown     for (Ii=Istart; Ii<Iend; Ii++) {
44c4762a1bSJed Brown       v = -1.5; i = Ii/n;
45*5f80ce2aSJacob Faibussowitsch       if (i>1) {J = Ii-n-1; CHKERRQ(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));}
46c4762a1bSJed Brown     }
47c4762a1bSJed Brown   } else {
48*5f80ce2aSJacob Faibussowitsch     CHKERRQ(MatSetOption(C,MAT_SYMMETRIC,PETSC_TRUE));
49*5f80ce2aSJacob Faibussowitsch     CHKERRQ(MatSetOption(C,MAT_SYMMETRY_ETERNAL,PETSC_TRUE));
50c4762a1bSJed Brown   }
51*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY));
52*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY));
53*5f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectSetName((PetscObject)C,"C"));
54*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatViewFromOptions(C,NULL,"-view"));
55c4762a1bSJed Brown 
56b84f494bSStefano Zampini   /* C1 = 2.0*C1 + C, C1 is anti-diagonal and has different non-zeros than C */
57*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatCreate(PETSC_COMM_WORLD,&C1));
58*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSetSizes(C1,PETSC_DECIDE,PETSC_DECIDE,m*n,m*n));
59*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSetFromOptions(C1));
60*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatSeqAIJSetPreallocation(C1,1,NULL));
61*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatMPIAIJSetPreallocation(C1,1,NULL,1,NULL));
62c4762a1bSJed Brown   for (Ii=Istart; Ii<Iend; Ii++) {
63039c6fbaSStefano Zampini     v = 1.0;
64039c6fbaSStefano Zampini     i = m*n - Ii -1;
65039c6fbaSStefano Zampini     j = Ii;
66*5f80ce2aSJacob Faibussowitsch     CHKERRQ(MatSetValues(C1,1,&i,1,&j,&v,ADD_VALUES));
67c4762a1bSJed Brown   }
68*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyBegin(C1,MAT_FINAL_ASSEMBLY));
69*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyEnd(C1,MAT_FINAL_ASSEMBLY));
70*5f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectSetName((PetscObject)C1,"C1"));
71*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatViewFromOptions(C1,NULL,"-view"));
72*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDuplicate(C1,MAT_COPY_VALUES,&CU));
73b84f494bSStefano Zampini 
74*5f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscPrintf(PETSC_COMM_WORLD," MatAXPY(C1,2.0,C,DIFFERENT_NONZERO_PATTERN)...\n"));
75*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAXPY(C1,2.0,C,DIFFERENT_NONZERO_PATTERN));
76*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAXPY(CU,2.0,C,UNKNOWN_NONZERO_PATTERN));
77*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetInfo(C1,MAT_GLOBAL_SUM,&info));
78*5f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscPrintf(PETSC_COMM_WORLD," C1: nz_allocated = %g; nz_used = %g; nz_unneeded = %g\n",info.nz_allocated,info.nz_used, info.nz_unneeded));
79*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatViewFromOptions(C1,NULL,"-view"));
80*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatMultEqual(CU,C1,10,&flg));
81b84f494bSStefano Zampini   if (!flg) {
82*5f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscPrintf(PETSC_COMM_WORLD,"Error UNKNOWN_NONZERO_PATTERN (supposedly DIFFERENT_NONZERO_PATTERN)\n"));
83*5f80ce2aSJacob Faibussowitsch     CHKERRQ(MatViewFromOptions(CU,NULL,"-view"));
84b84f494bSStefano Zampini   }
85*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDestroy(&CU));
86c4762a1bSJed Brown 
87b84f494bSStefano Zampini   /* Secondly, compute C1 = 2.0*C2 + C1, C2 has non-zero pattern of C */
88*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDuplicate(C,MAT_DO_NOT_COPY_VALUES,&C2));
89*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDuplicate(C1,MAT_COPY_VALUES,&CU));
90c4762a1bSJed Brown 
91c4762a1bSJed Brown   for (Ii=Istart; Ii<Iend; Ii++) {
92c4762a1bSJed Brown     v    = 1.0;
93*5f80ce2aSJacob Faibussowitsch     CHKERRQ(MatSetValues(C2,1,&Ii,1,&Ii,&v,ADD_VALUES));
94c4762a1bSJed Brown   }
95*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyBegin(C2,MAT_FINAL_ASSEMBLY));
96*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAssemblyEnd(C2,MAT_FINAL_ASSEMBLY));
97*5f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscObjectSetName((PetscObject)C2,"C2"));
98*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatViewFromOptions(C2,NULL,"-view"));
99*5f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscPrintf(PETSC_COMM_WORLD," MatAXPY(C1,2.0,C2,SUBSET_NONZERO_PATTERN)...\n"));
100*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAXPY(C1,2.0,C2,SUBSET_NONZERO_PATTERN));
101*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAXPY(CU,2.0,C2,UNKNOWN_NONZERO_PATTERN));
102*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetInfo(C1,MAT_GLOBAL_SUM,&info));
103*5f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscPrintf(PETSC_COMM_WORLD," C1: nz_allocated = %g; nz_used = %g; nz_unneeded = %g\n",info.nz_allocated,info.nz_used, info.nz_unneeded));
104*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatViewFromOptions(C1,NULL,"-view"));
105*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatMultEqual(CU,C1,10,&flg));
106b84f494bSStefano Zampini   if (!flg) {
107*5f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscPrintf(PETSC_COMM_WORLD,"Error UNKNOWN_NONZERO_PATTERN (supposedly SUBSET_NONZERO_PATTERN)\n"));
108*5f80ce2aSJacob Faibussowitsch     CHKERRQ(MatViewFromOptions(CU,NULL,"-view"));
109b84f494bSStefano Zampini   }
110*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDestroy(&CU));
111039c6fbaSStefano Zampini 
112b84f494bSStefano Zampini   /* Test SAME_NONZERO_PATTERN computing C2 = C2 + 2.0 * C */
113*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDuplicate(C2,MAT_COPY_VALUES,&CU));
114*5f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscPrintf(PETSC_COMM_WORLD," MatAXPY(C2,2.0,C,SAME_NONZERO_PATTERN)...\n"));
115*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAXPY(C2,2.0,C,SAME_NONZERO_PATTERN));
116*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatAXPY(CU,2.0,C,UNKNOWN_NONZERO_PATTERN));
117*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatGetInfo(C2,MAT_GLOBAL_SUM,&info));
118*5f80ce2aSJacob Faibussowitsch   CHKERRQ(PetscPrintf(PETSC_COMM_WORLD," C2: nz_allocated = %g; nz_used = %g; nz_unneeded = %g\n",info.nz_allocated,info.nz_used, info.nz_unneeded));
119*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatViewFromOptions(C2,NULL,"-view"));
120*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatMultEqual(CU,C2,10,&flg));
121b84f494bSStefano Zampini   if (!flg) {
122*5f80ce2aSJacob Faibussowitsch     CHKERRQ(PetscPrintf(PETSC_COMM_WORLD,"Error UNKNOWN_NONZERO_PATTERN (supposedly SUBSET_NONZERO_PATTERN)\n"));
123*5f80ce2aSJacob Faibussowitsch     CHKERRQ(MatViewFromOptions(CU,NULL,"-view"));
124b84f494bSStefano Zampini   }
125*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDestroy(&CU));
126c4762a1bSJed Brown 
127*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDestroy(&C1));
128*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDestroy(&C2));
129*5f80ce2aSJacob Faibussowitsch   CHKERRQ(MatDestroy(&C));
130c4762a1bSJed Brown 
131c4762a1bSJed Brown   ierr = PetscFinalize();
132c4762a1bSJed Brown   return ierr;
133c4762a1bSJed Brown }
134c4762a1bSJed Brown 
135c4762a1bSJed Brown /*TEST
136c4762a1bSJed Brown 
137c4762a1bSJed Brown    test:
138039c6fbaSStefano Zampini      suffix: 1
139039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
140039c6fbaSStefano Zampini      args: -view
141039c6fbaSStefano Zampini      diff_args: -j
142039c6fbaSStefano Zampini 
143039c6fbaSStefano Zampini    test:
144039c6fbaSStefano Zampini      output_file: output/ex132_1.out
145039c6fbaSStefano Zampini      requires: cuda
146039c6fbaSStefano Zampini      suffix: 1_cuda
147039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
148039c6fbaSStefano Zampini      args: -view -mat_type aijcusparse
149039c6fbaSStefano Zampini      diff_args: -j
150039c6fbaSStefano Zampini 
151039c6fbaSStefano Zampini    test:
152039c6fbaSStefano Zampini      output_file: output/ex132_1.out
153039c6fbaSStefano Zampini      requires: kokkos_kernels
154039c6fbaSStefano Zampini      suffix: 1_kokkos
155039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
156039c6fbaSStefano Zampini      args: -view -mat_type aijkokkos
157039c6fbaSStefano Zampini      diff_args: -j
158039c6fbaSStefano Zampini 
159039c6fbaSStefano Zampini    test:
160039c6fbaSStefano Zampini      suffix: 2
161039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
162039c6fbaSStefano Zampini      args: -view -mat_nonsym
163039c6fbaSStefano Zampini      diff_args: -j
164039c6fbaSStefano Zampini 
165039c6fbaSStefano Zampini    test:
166039c6fbaSStefano Zampini      output_file: output/ex132_2.out
167039c6fbaSStefano Zampini      requires: cuda
168039c6fbaSStefano Zampini      suffix: 2_cuda
169039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
170039c6fbaSStefano Zampini      args: -view -mat_type aijcusparse -mat_nonsym
171039c6fbaSStefano Zampini      diff_args: -j
172039c6fbaSStefano Zampini 
173039c6fbaSStefano Zampini    test:
174039c6fbaSStefano Zampini      output_file: output/ex132_2.out
175039c6fbaSStefano Zampini      requires: kokkos_kernels
176039c6fbaSStefano Zampini      suffix: 2_kokkos
177039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
178039c6fbaSStefano Zampini      args: -view -mat_type aijkokkos -mat_nonsym
179039c6fbaSStefano Zampini      diff_args: -j
180039c6fbaSStefano Zampini 
181039c6fbaSStefano Zampini    test:
182039c6fbaSStefano Zampini      nsize: 2
183039c6fbaSStefano Zampini      suffix: 1_par
184039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
185039c6fbaSStefano Zampini      args: -view
186039c6fbaSStefano Zampini      diff_args: -j
187039c6fbaSStefano Zampini 
188039c6fbaSStefano Zampini    test:
189039c6fbaSStefano Zampini      nsize: 2
190039c6fbaSStefano Zampini      output_file: output/ex132_1_par.out
191039c6fbaSStefano Zampini      requires: cuda
192039c6fbaSStefano Zampini      suffix: 1_par_cuda
193039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
194039c6fbaSStefano Zampini      args: -view -mat_type aijcusparse
195039c6fbaSStefano Zampini      diff_args: -j
196039c6fbaSStefano Zampini 
197039c6fbaSStefano Zampini    test:
198039c6fbaSStefano Zampini      nsize: 2
199039c6fbaSStefano Zampini      output_file: output/ex132_1_par.out
2003078479eSJunchao Zhang      requires: !sycl kokkos_kernels
201039c6fbaSStefano Zampini      suffix: 1_par_kokkos
202039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
203039c6fbaSStefano Zampini      args: -view -mat_type aijkokkos
204039c6fbaSStefano Zampini      diff_args: -j
205039c6fbaSStefano Zampini 
206039c6fbaSStefano Zampini    test:
207039c6fbaSStefano Zampini      nsize: 2
208039c6fbaSStefano Zampini      suffix: 2_par
209039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
210039c6fbaSStefano Zampini      args: -view -mat_nonsym
211039c6fbaSStefano Zampini      diff_args: -j
212039c6fbaSStefano Zampini 
213039c6fbaSStefano Zampini    test:
214039c6fbaSStefano Zampini      nsize: 2
215039c6fbaSStefano Zampini      output_file: output/ex132_2_par.out
216039c6fbaSStefano Zampini      requires: cuda
217039c6fbaSStefano Zampini      suffix: 2_par_cuda
218039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
219039c6fbaSStefano Zampini      args: -view -mat_type aijcusparse -mat_nonsym
220039c6fbaSStefano Zampini      diff_args: -j
221039c6fbaSStefano Zampini 
222f3482364SScott Kruger    testset:
223039c6fbaSStefano Zampini      nsize: 2
224039c6fbaSStefano Zampini      output_file: output/ex132_2_par.out
2253078479eSJunchao Zhang      requires: !sycl kokkos_kernels
226039c6fbaSStefano Zampini      filter: grep -v " type:" | grep -v "Mat Object"
227f3482364SScott Kruger      args: -view -mat_type aijkokkos -mat_nonsym
228039c6fbaSStefano Zampini      diff_args: -j
229f3482364SScott Kruger      test:
230f3482364SScott Kruger        suffix: 2_par_kokkos_no_gpu_aware
231f3482364SScott Kruger        args: -use_gpu_aware_mpi 0
232f3482364SScott Kruger      test:
233f3482364SScott Kruger        requires: defined(HAVE_MPI_GPU_AWARE)
234f3482364SScott Kruger        suffix: 2_par_kokkos_gpu_aware
235f3482364SScott Kruger        args: -use_gpu_aware_mpi 1
236c4762a1bSJed Brown 
237c4762a1bSJed Brown TEST*/
238