1c4762a1bSJed Brown 2039c6fbaSStefano Zampini static char help[] = "Test MatAXPY()\n\n"; 3c4762a1bSJed Brown 4c4762a1bSJed Brown #include <petscmat.h> 5c4762a1bSJed Brown 6c4762a1bSJed Brown int main(int argc,char **args) 7c4762a1bSJed Brown { 8b84f494bSStefano Zampini Mat C,C1,C2,CU; 9c4762a1bSJed Brown PetscScalar v; 10c4762a1bSJed Brown PetscInt Ii,J,Istart,Iend; 11039c6fbaSStefano Zampini PetscInt i,j,m = 3,n; 12039c6fbaSStefano Zampini PetscMPIInt size; 13b84f494bSStefano Zampini PetscBool mat_nonsymmetric = PETSC_FALSE,flg; 14c4762a1bSJed Brown MatInfo info; 15c4762a1bSJed Brown 16*9566063dSJacob Faibussowitsch PetscCall(PetscInitialize(&argc,&args,(char*)0,help)); 17*9566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetInt(NULL,NULL,"-m",&m,NULL)); 18*9566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PETSC_COMM_WORLD,&size)); 19c4762a1bSJed Brown n = 2*size; 20c4762a1bSJed Brown 21c4762a1bSJed Brown /* Set flag if we are doing a nonsymmetric problem; the default is symmetric. */ 22*9566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(NULL,NULL,"-mat_nonsym",&mat_nonsymmetric,NULL)); 23c4762a1bSJed Brown 24*9566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_WORLD,&C)); 25*9566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,PETSC_DECIDE,PETSC_DECIDE,m*n,m*n)); 26*9566063dSJacob Faibussowitsch PetscCall(MatSetFromOptions(C)); 27*9566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C,5,NULL)); 28*9566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(C,5,NULL,5,NULL)); 29c4762a1bSJed Brown 30*9566063dSJacob Faibussowitsch PetscCall(MatGetOwnershipRange(C,&Istart,&Iend)); 31c4762a1bSJed Brown for (Ii=Istart; Ii<Iend; Ii++) { 32c4762a1bSJed Brown v = -1.0; i = Ii/n; j = Ii - i*n; 33*9566063dSJacob Faibussowitsch if (i>0) {J = Ii - n; PetscCall(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));} 34*9566063dSJacob Faibussowitsch if (i<m-1) {J = Ii + n; PetscCall(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));} 35*9566063dSJacob Faibussowitsch if (j>0) {J = Ii - 1; PetscCall(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));} 36*9566063dSJacob Faibussowitsch if (j<n-1) {J = Ii + 1; PetscCall(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));} 37*9566063dSJacob Faibussowitsch v = 4.0; PetscCall(MatSetValues(C,1,&Ii,1,&Ii,&v,ADD_VALUES)); 38c4762a1bSJed Brown } 39c4762a1bSJed Brown 40c4762a1bSJed Brown /* Make the matrix nonsymmetric if desired */ 41c4762a1bSJed Brown if (mat_nonsymmetric) { 42c4762a1bSJed Brown for (Ii=Istart; Ii<Iend; Ii++) { 43c4762a1bSJed Brown v = -1.5; i = Ii/n; 44*9566063dSJacob Faibussowitsch if (i>1) {J = Ii-n-1; PetscCall(MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES));} 45c4762a1bSJed Brown } 46c4762a1bSJed Brown } else { 47*9566063dSJacob Faibussowitsch PetscCall(MatSetOption(C,MAT_SYMMETRIC,PETSC_TRUE)); 48*9566063dSJacob Faibussowitsch PetscCall(MatSetOption(C,MAT_SYMMETRY_ETERNAL,PETSC_TRUE)); 49c4762a1bSJed Brown } 50*9566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY)); 51*9566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY)); 52*9566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)C,"C")); 53*9566063dSJacob Faibussowitsch PetscCall(MatViewFromOptions(C,NULL,"-view")); 54c4762a1bSJed Brown 55b84f494bSStefano Zampini /* C1 = 2.0*C1 + C, C1 is anti-diagonal and has different non-zeros than C */ 56*9566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_WORLD,&C1)); 57*9566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C1,PETSC_DECIDE,PETSC_DECIDE,m*n,m*n)); 58*9566063dSJacob Faibussowitsch PetscCall(MatSetFromOptions(C1)); 59*9566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C1,1,NULL)); 60*9566063dSJacob Faibussowitsch PetscCall(MatMPIAIJSetPreallocation(C1,1,NULL,1,NULL)); 61c4762a1bSJed Brown for (Ii=Istart; Ii<Iend; Ii++) { 62039c6fbaSStefano Zampini v = 1.0; 63039c6fbaSStefano Zampini i = m*n - Ii -1; 64039c6fbaSStefano Zampini j = Ii; 65*9566063dSJacob Faibussowitsch PetscCall(MatSetValues(C1,1,&i,1,&j,&v,ADD_VALUES)); 66c4762a1bSJed Brown } 67*9566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C1,MAT_FINAL_ASSEMBLY)); 68*9566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C1,MAT_FINAL_ASSEMBLY)); 69*9566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)C1,"C1")); 70*9566063dSJacob Faibussowitsch PetscCall(MatViewFromOptions(C1,NULL,"-view")); 71*9566063dSJacob Faibussowitsch PetscCall(MatDuplicate(C1,MAT_COPY_VALUES,&CU)); 72b84f494bSStefano Zampini 73*9566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD," MatAXPY(C1,2.0,C,DIFFERENT_NONZERO_PATTERN)...\n")); 74*9566063dSJacob Faibussowitsch PetscCall(MatAXPY(C1,2.0,C,DIFFERENT_NONZERO_PATTERN)); 75*9566063dSJacob Faibussowitsch PetscCall(MatAXPY(CU,2.0,C,UNKNOWN_NONZERO_PATTERN)); 76*9566063dSJacob Faibussowitsch PetscCall(MatGetInfo(C1,MAT_GLOBAL_SUM,&info)); 77*9566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD," C1: nz_allocated = %g; nz_used = %g; nz_unneeded = %g\n",info.nz_allocated,info.nz_used, info.nz_unneeded)); 78*9566063dSJacob Faibussowitsch PetscCall(MatViewFromOptions(C1,NULL,"-view")); 79*9566063dSJacob Faibussowitsch PetscCall(MatMultEqual(CU,C1,10,&flg)); 80b84f494bSStefano Zampini if (!flg) { 81*9566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD,"Error UNKNOWN_NONZERO_PATTERN (supposedly DIFFERENT_NONZERO_PATTERN)\n")); 82*9566063dSJacob Faibussowitsch PetscCall(MatViewFromOptions(CU,NULL,"-view")); 83b84f494bSStefano Zampini } 84*9566063dSJacob Faibussowitsch PetscCall(MatDestroy(&CU)); 85c4762a1bSJed Brown 86b84f494bSStefano Zampini /* Secondly, compute C1 = 2.0*C2 + C1, C2 has non-zero pattern of C */ 87*9566063dSJacob Faibussowitsch PetscCall(MatDuplicate(C,MAT_DO_NOT_COPY_VALUES,&C2)); 88*9566063dSJacob Faibussowitsch PetscCall(MatDuplicate(C1,MAT_COPY_VALUES,&CU)); 89c4762a1bSJed Brown 90c4762a1bSJed Brown for (Ii=Istart; Ii<Iend; Ii++) { 91c4762a1bSJed Brown v = 1.0; 92*9566063dSJacob Faibussowitsch PetscCall(MatSetValues(C2,1,&Ii,1,&Ii,&v,ADD_VALUES)); 93c4762a1bSJed Brown } 94*9566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C2,MAT_FINAL_ASSEMBLY)); 95*9566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C2,MAT_FINAL_ASSEMBLY)); 96*9566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)C2,"C2")); 97*9566063dSJacob Faibussowitsch PetscCall(MatViewFromOptions(C2,NULL,"-view")); 98*9566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD," MatAXPY(C1,2.0,C2,SUBSET_NONZERO_PATTERN)...\n")); 99*9566063dSJacob Faibussowitsch PetscCall(MatAXPY(C1,2.0,C2,SUBSET_NONZERO_PATTERN)); 100*9566063dSJacob Faibussowitsch PetscCall(MatAXPY(CU,2.0,C2,UNKNOWN_NONZERO_PATTERN)); 101*9566063dSJacob Faibussowitsch PetscCall(MatGetInfo(C1,MAT_GLOBAL_SUM,&info)); 102*9566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD," C1: nz_allocated = %g; nz_used = %g; nz_unneeded = %g\n",info.nz_allocated,info.nz_used, info.nz_unneeded)); 103*9566063dSJacob Faibussowitsch PetscCall(MatViewFromOptions(C1,NULL,"-view")); 104*9566063dSJacob Faibussowitsch PetscCall(MatMultEqual(CU,C1,10,&flg)); 105b84f494bSStefano Zampini if (!flg) { 106*9566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD,"Error UNKNOWN_NONZERO_PATTERN (supposedly SUBSET_NONZERO_PATTERN)\n")); 107*9566063dSJacob Faibussowitsch PetscCall(MatViewFromOptions(CU,NULL,"-view")); 108b84f494bSStefano Zampini } 109*9566063dSJacob Faibussowitsch PetscCall(MatDestroy(&CU)); 110039c6fbaSStefano Zampini 111b84f494bSStefano Zampini /* Test SAME_NONZERO_PATTERN computing C2 = C2 + 2.0 * C */ 112*9566063dSJacob Faibussowitsch PetscCall(MatDuplicate(C2,MAT_COPY_VALUES,&CU)); 113*9566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD," MatAXPY(C2,2.0,C,SAME_NONZERO_PATTERN)...\n")); 114*9566063dSJacob Faibussowitsch PetscCall(MatAXPY(C2,2.0,C,SAME_NONZERO_PATTERN)); 115*9566063dSJacob Faibussowitsch PetscCall(MatAXPY(CU,2.0,C,UNKNOWN_NONZERO_PATTERN)); 116*9566063dSJacob Faibussowitsch PetscCall(MatGetInfo(C2,MAT_GLOBAL_SUM,&info)); 117*9566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD," C2: nz_allocated = %g; nz_used = %g; nz_unneeded = %g\n",info.nz_allocated,info.nz_used, info.nz_unneeded)); 118*9566063dSJacob Faibussowitsch PetscCall(MatViewFromOptions(C2,NULL,"-view")); 119*9566063dSJacob Faibussowitsch PetscCall(MatMultEqual(CU,C2,10,&flg)); 120b84f494bSStefano Zampini if (!flg) { 121*9566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD,"Error UNKNOWN_NONZERO_PATTERN (supposedly SUBSET_NONZERO_PATTERN)\n")); 122*9566063dSJacob Faibussowitsch PetscCall(MatViewFromOptions(CU,NULL,"-view")); 123b84f494bSStefano Zampini } 124*9566063dSJacob Faibussowitsch PetscCall(MatDestroy(&CU)); 125c4762a1bSJed Brown 126*9566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C1)); 127*9566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C2)); 128*9566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 129c4762a1bSJed Brown 130*9566063dSJacob Faibussowitsch PetscCall(PetscFinalize()); 131b122ec5aSJacob Faibussowitsch return 0; 132c4762a1bSJed Brown } 133c4762a1bSJed Brown 134c4762a1bSJed Brown /*TEST 135c4762a1bSJed Brown 136c4762a1bSJed Brown test: 137039c6fbaSStefano Zampini suffix: 1 138039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 139039c6fbaSStefano Zampini args: -view 140039c6fbaSStefano Zampini diff_args: -j 141039c6fbaSStefano Zampini 142039c6fbaSStefano Zampini test: 143039c6fbaSStefano Zampini output_file: output/ex132_1.out 144039c6fbaSStefano Zampini requires: cuda 145039c6fbaSStefano Zampini suffix: 1_cuda 146039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 147039c6fbaSStefano Zampini args: -view -mat_type aijcusparse 148039c6fbaSStefano Zampini diff_args: -j 149039c6fbaSStefano Zampini 150039c6fbaSStefano Zampini test: 151039c6fbaSStefano Zampini output_file: output/ex132_1.out 152039c6fbaSStefano Zampini requires: kokkos_kernels 153039c6fbaSStefano Zampini suffix: 1_kokkos 154039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 155039c6fbaSStefano Zampini args: -view -mat_type aijkokkos 156039c6fbaSStefano Zampini diff_args: -j 157039c6fbaSStefano Zampini 158039c6fbaSStefano Zampini test: 159039c6fbaSStefano Zampini suffix: 2 160039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 161039c6fbaSStefano Zampini args: -view -mat_nonsym 162039c6fbaSStefano Zampini diff_args: -j 163039c6fbaSStefano Zampini 164039c6fbaSStefano Zampini test: 165039c6fbaSStefano Zampini output_file: output/ex132_2.out 166039c6fbaSStefano Zampini requires: cuda 167039c6fbaSStefano Zampini suffix: 2_cuda 168039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 169039c6fbaSStefano Zampini args: -view -mat_type aijcusparse -mat_nonsym 170039c6fbaSStefano Zampini diff_args: -j 171039c6fbaSStefano Zampini 172039c6fbaSStefano Zampini test: 173039c6fbaSStefano Zampini output_file: output/ex132_2.out 174039c6fbaSStefano Zampini requires: kokkos_kernels 175039c6fbaSStefano Zampini suffix: 2_kokkos 176039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 177039c6fbaSStefano Zampini args: -view -mat_type aijkokkos -mat_nonsym 178039c6fbaSStefano Zampini diff_args: -j 179039c6fbaSStefano Zampini 180039c6fbaSStefano Zampini test: 181039c6fbaSStefano Zampini nsize: 2 182039c6fbaSStefano Zampini suffix: 1_par 183039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 184039c6fbaSStefano Zampini args: -view 185039c6fbaSStefano Zampini diff_args: -j 186039c6fbaSStefano Zampini 187039c6fbaSStefano Zampini test: 188039c6fbaSStefano Zampini nsize: 2 189039c6fbaSStefano Zampini output_file: output/ex132_1_par.out 190039c6fbaSStefano Zampini requires: cuda 191039c6fbaSStefano Zampini suffix: 1_par_cuda 192039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 193039c6fbaSStefano Zampini args: -view -mat_type aijcusparse 194039c6fbaSStefano Zampini diff_args: -j 195039c6fbaSStefano Zampini 196039c6fbaSStefano Zampini test: 197039c6fbaSStefano Zampini nsize: 2 198039c6fbaSStefano Zampini output_file: output/ex132_1_par.out 1993078479eSJunchao Zhang requires: !sycl kokkos_kernels 200039c6fbaSStefano Zampini suffix: 1_par_kokkos 201039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 202039c6fbaSStefano Zampini args: -view -mat_type aijkokkos 203039c6fbaSStefano Zampini diff_args: -j 204039c6fbaSStefano Zampini 205039c6fbaSStefano Zampini test: 206039c6fbaSStefano Zampini nsize: 2 207039c6fbaSStefano Zampini suffix: 2_par 208039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 209039c6fbaSStefano Zampini args: -view -mat_nonsym 210039c6fbaSStefano Zampini diff_args: -j 211039c6fbaSStefano Zampini 212039c6fbaSStefano Zampini test: 213039c6fbaSStefano Zampini nsize: 2 214039c6fbaSStefano Zampini output_file: output/ex132_2_par.out 215039c6fbaSStefano Zampini requires: cuda 216039c6fbaSStefano Zampini suffix: 2_par_cuda 217039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 218039c6fbaSStefano Zampini args: -view -mat_type aijcusparse -mat_nonsym 219039c6fbaSStefano Zampini diff_args: -j 220039c6fbaSStefano Zampini 221f3482364SScott Kruger testset: 222039c6fbaSStefano Zampini nsize: 2 223039c6fbaSStefano Zampini output_file: output/ex132_2_par.out 2243078479eSJunchao Zhang requires: !sycl kokkos_kernels 225039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 226f3482364SScott Kruger args: -view -mat_type aijkokkos -mat_nonsym 227039c6fbaSStefano Zampini diff_args: -j 228f3482364SScott Kruger test: 229f3482364SScott Kruger suffix: 2_par_kokkos_no_gpu_aware 230f3482364SScott Kruger args: -use_gpu_aware_mpi 0 231f3482364SScott Kruger test: 232f3482364SScott Kruger requires: defined(HAVE_MPI_GPU_AWARE) 233f3482364SScott Kruger suffix: 2_par_kokkos_gpu_aware 234f3482364SScott Kruger args: -use_gpu_aware_mpi 1 235c4762a1bSJed Brown 236c4762a1bSJed Brown TEST*/ 237