1c4762a1bSJed Brown 2039c6fbaSStefano Zampini static char help[] = "Test MatAXPY()\n\n"; 3c4762a1bSJed Brown 4c4762a1bSJed Brown #include <petscmat.h> 5c4762a1bSJed Brown 6c4762a1bSJed Brown int main(int argc,char **args) 7c4762a1bSJed Brown { 8b84f494bSStefano Zampini Mat C,C1,C2,CU; 9c4762a1bSJed Brown PetscScalar v; 10c4762a1bSJed Brown PetscInt Ii,J,Istart,Iend; 11c4762a1bSJed Brown PetscErrorCode ierr; 12039c6fbaSStefano Zampini PetscInt i,j,m = 3,n; 13039c6fbaSStefano Zampini PetscMPIInt size; 14b84f494bSStefano Zampini PetscBool mat_nonsymmetric = PETSC_FALSE,flg; 15c4762a1bSJed Brown MatInfo info; 16c4762a1bSJed Brown 17c4762a1bSJed Brown ierr = PetscInitialize(&argc,&args,(char*)0,help);if (ierr) return ierr; 18c4762a1bSJed Brown ierr = PetscOptionsGetInt(NULL,NULL,"-m",&m,NULL);CHKERRQ(ierr); 19ffc4695bSBarry Smith ierr = MPI_Comm_size(PETSC_COMM_WORLD,&size);CHKERRMPI(ierr); 20c4762a1bSJed Brown n = 2*size; 21c4762a1bSJed Brown 22c4762a1bSJed Brown /* Set flag if we are doing a nonsymmetric problem; the default is symmetric. */ 23c4762a1bSJed Brown ierr = PetscOptionsGetBool(NULL,NULL,"-mat_nonsym",&mat_nonsymmetric,NULL);CHKERRQ(ierr); 24c4762a1bSJed Brown 25c4762a1bSJed Brown ierr = MatCreate(PETSC_COMM_WORLD,&C);CHKERRQ(ierr); 26c4762a1bSJed Brown ierr = MatSetSizes(C,PETSC_DECIDE,PETSC_DECIDE,m*n,m*n);CHKERRQ(ierr); 27c4762a1bSJed Brown ierr = MatSetFromOptions(C);CHKERRQ(ierr); 28c4762a1bSJed Brown ierr = MatSeqAIJSetPreallocation(C,5,NULL);CHKERRQ(ierr); 29039c6fbaSStefano Zampini ierr = MatMPIAIJSetPreallocation(C,5,NULL,5,NULL);CHKERRQ(ierr); 30c4762a1bSJed Brown 31c4762a1bSJed Brown ierr = MatGetOwnershipRange(C,&Istart,&Iend);CHKERRQ(ierr); 32c4762a1bSJed Brown for (Ii=Istart; Ii<Iend; Ii++) { 33c4762a1bSJed Brown v = -1.0; i = Ii/n; j = Ii - i*n; 34c4762a1bSJed Brown if (i>0) {J = Ii - n; ierr = MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES);CHKERRQ(ierr);} 35c4762a1bSJed Brown if (i<m-1) {J = Ii + n; ierr = MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES);CHKERRQ(ierr);} 36c4762a1bSJed Brown if (j>0) {J = Ii - 1; ierr = MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES);CHKERRQ(ierr);} 37c4762a1bSJed Brown if (j<n-1) {J = Ii + 1; ierr = MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES);CHKERRQ(ierr);} 38c4762a1bSJed Brown v = 4.0; ierr = MatSetValues(C,1,&Ii,1,&Ii,&v,ADD_VALUES);CHKERRQ(ierr); 39c4762a1bSJed Brown } 40c4762a1bSJed Brown 41c4762a1bSJed Brown /* Make the matrix nonsymmetric if desired */ 42c4762a1bSJed Brown if (mat_nonsymmetric) { 43c4762a1bSJed Brown for (Ii=Istart; Ii<Iend; Ii++) { 44c4762a1bSJed Brown v = -1.5; i = Ii/n; 45c4762a1bSJed Brown if (i>1) {J = Ii-n-1; ierr = MatSetValues(C,1,&Ii,1,&J,&v,ADD_VALUES);CHKERRQ(ierr);} 46c4762a1bSJed Brown } 47c4762a1bSJed Brown } else { 48c4762a1bSJed Brown ierr = MatSetOption(C,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr); 49c4762a1bSJed Brown ierr = MatSetOption(C,MAT_SYMMETRY_ETERNAL,PETSC_TRUE);CHKERRQ(ierr); 50c4762a1bSJed Brown } 51c4762a1bSJed Brown ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 52c4762a1bSJed Brown ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 53039c6fbaSStefano Zampini ierr = PetscObjectSetName((PetscObject)C,"C");CHKERRQ(ierr); 54039c6fbaSStefano Zampini ierr = MatViewFromOptions(C,NULL,"-view");CHKERRQ(ierr); 55c4762a1bSJed Brown 56b84f494bSStefano Zampini /* C1 = 2.0*C1 + C, C1 is anti-diagonal and has different non-zeros than C */ 57c4762a1bSJed Brown ierr = MatCreate(PETSC_COMM_WORLD,&C1);CHKERRQ(ierr); 58c4762a1bSJed Brown ierr = MatSetSizes(C1,PETSC_DECIDE,PETSC_DECIDE,m*n,m*n);CHKERRQ(ierr); 59c4762a1bSJed Brown ierr = MatSetFromOptions(C1);CHKERRQ(ierr); 60c4762a1bSJed Brown ierr = MatSeqAIJSetPreallocation(C1,1,NULL);CHKERRQ(ierr); 61039c6fbaSStefano Zampini ierr = MatMPIAIJSetPreallocation(C1,1,NULL,1,NULL);CHKERRQ(ierr); 62c4762a1bSJed Brown for (Ii=Istart; Ii<Iend; Ii++) { 63039c6fbaSStefano Zampini v = 1.0; 64039c6fbaSStefano Zampini i = m*n - Ii -1; 65039c6fbaSStefano Zampini j = Ii; 66039c6fbaSStefano Zampini ierr = MatSetValues(C1,1,&i,1,&j,&v,ADD_VALUES);CHKERRQ(ierr); 67c4762a1bSJed Brown } 68c4762a1bSJed Brown ierr = MatAssemblyBegin(C1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 69c4762a1bSJed Brown ierr = MatAssemblyEnd(C1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 70039c6fbaSStefano Zampini ierr = PetscObjectSetName((PetscObject)C1,"C1");CHKERRQ(ierr); 71039c6fbaSStefano Zampini ierr = MatViewFromOptions(C1,NULL,"-view");CHKERRQ(ierr); 72b84f494bSStefano Zampini ierr = MatDuplicate(C1,MAT_COPY_VALUES,&CU);CHKERRQ(ierr); 73b84f494bSStefano Zampini 74c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD," MatAXPY(C1,2.0,C,DIFFERENT_NONZERO_PATTERN)...\n");CHKERRQ(ierr); 75c4762a1bSJed Brown ierr = MatAXPY(C1,2.0,C,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 76b84f494bSStefano Zampini ierr = MatAXPY(CU,2.0,C,UNKNOWN_NONZERO_PATTERN);CHKERRQ(ierr); 77c4762a1bSJed Brown ierr = MatGetInfo(C1,MAT_GLOBAL_SUM,&info);CHKERRQ(ierr); 78c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD," C1: nz_allocated = %g; nz_used = %g; nz_unneeded = %g\n",info.nz_allocated,info.nz_used, info.nz_unneeded);CHKERRQ(ierr); 79039c6fbaSStefano Zampini ierr = MatViewFromOptions(C1,NULL,"-view");CHKERRQ(ierr); 80b84f494bSStefano Zampini ierr = MatMultEqual(CU,C1,10,&flg);CHKERRQ(ierr); 81b84f494bSStefano Zampini if (!flg) { 82b84f494bSStefano Zampini ierr = PetscPrintf(PETSC_COMM_WORLD,"Error UNKNOWN_NONZERO_PATTERN (supposedly DIFFERENT_NONZERO_PATTERN)\n");CHKERRQ(ierr); 83b84f494bSStefano Zampini ierr = MatViewFromOptions(CU,NULL,"-view");CHKERRQ(ierr); 84b84f494bSStefano Zampini } 85b84f494bSStefano Zampini ierr = MatDestroy(&CU);CHKERRQ(ierr); 86c4762a1bSJed Brown 87b84f494bSStefano Zampini /* Secondly, compute C1 = 2.0*C2 + C1, C2 has non-zero pattern of C */ 88c4762a1bSJed Brown ierr = MatDuplicate(C,MAT_DO_NOT_COPY_VALUES,&C2);CHKERRQ(ierr); 89b84f494bSStefano Zampini ierr = MatDuplicate(C1,MAT_COPY_VALUES,&CU);CHKERRQ(ierr); 90c4762a1bSJed Brown 91c4762a1bSJed Brown for (Ii=Istart; Ii<Iend; Ii++) { 92c4762a1bSJed Brown v = 1.0; 93c4762a1bSJed Brown ierr = MatSetValues(C2,1,&Ii,1,&Ii,&v,ADD_VALUES);CHKERRQ(ierr); 94c4762a1bSJed Brown } 95c4762a1bSJed Brown ierr = MatAssemblyBegin(C2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 96c4762a1bSJed Brown ierr = MatAssemblyEnd(C2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 97039c6fbaSStefano Zampini ierr = PetscObjectSetName((PetscObject)C2,"C2");CHKERRQ(ierr); 98039c6fbaSStefano Zampini ierr = MatViewFromOptions(C2,NULL,"-view");CHKERRQ(ierr); 99039c6fbaSStefano Zampini ierr = PetscPrintf(PETSC_COMM_WORLD," MatAXPY(C1,2.0,C2,SUBSET_NONZERO_PATTERN)...\n");CHKERRQ(ierr); 100039c6fbaSStefano Zampini ierr = MatAXPY(C1,2.0,C2,SUBSET_NONZERO_PATTERN);CHKERRQ(ierr); 101b84f494bSStefano Zampini ierr = MatAXPY(CU,2.0,C2,UNKNOWN_NONZERO_PATTERN);CHKERRQ(ierr); 102039c6fbaSStefano Zampini ierr = MatGetInfo(C1,MAT_GLOBAL_SUM,&info);CHKERRQ(ierr); 103039c6fbaSStefano Zampini ierr = PetscPrintf(PETSC_COMM_WORLD," C1: nz_allocated = %g; nz_used = %g; nz_unneeded = %g\n",info.nz_allocated,info.nz_used, info.nz_unneeded);CHKERRQ(ierr); 104039c6fbaSStefano Zampini ierr = MatViewFromOptions(C1,NULL,"-view");CHKERRQ(ierr); 105b84f494bSStefano Zampini ierr = MatMultEqual(CU,C1,10,&flg);CHKERRQ(ierr); 106b84f494bSStefano Zampini if (!flg) { 107b84f494bSStefano Zampini ierr = PetscPrintf(PETSC_COMM_WORLD,"Error UNKNOWN_NONZERO_PATTERN (supposedly SUBSET_NONZERO_PATTERN)\n");CHKERRQ(ierr); 108b84f494bSStefano Zampini ierr = MatViewFromOptions(CU,NULL,"-view");CHKERRQ(ierr); 109b84f494bSStefano Zampini } 110b84f494bSStefano Zampini ierr = MatDestroy(&CU);CHKERRQ(ierr); 111039c6fbaSStefano Zampini 112b84f494bSStefano Zampini /* Test SAME_NONZERO_PATTERN computing C2 = C2 + 2.0 * C */ 113b84f494bSStefano Zampini ierr = MatDuplicate(C2,MAT_COPY_VALUES,&CU);CHKERRQ(ierr); 114039c6fbaSStefano Zampini ierr = PetscPrintf(PETSC_COMM_WORLD," MatAXPY(C2,2.0,C,SAME_NONZERO_PATTERN)...\n");CHKERRQ(ierr); 115b84f494bSStefano Zampini ierr = MatAXPY(C2,2.0,C,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 116b84f494bSStefano Zampini ierr = MatAXPY(CU,2.0,C,UNKNOWN_NONZERO_PATTERN);CHKERRQ(ierr); 117c4762a1bSJed Brown ierr = MatGetInfo(C2,MAT_GLOBAL_SUM,&info);CHKERRQ(ierr); 118c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD," C2: nz_allocated = %g; nz_used = %g; nz_unneeded = %g\n",info.nz_allocated,info.nz_used, info.nz_unneeded);CHKERRQ(ierr); 119039c6fbaSStefano Zampini ierr = MatViewFromOptions(C2,NULL,"-view");CHKERRQ(ierr); 120b84f494bSStefano Zampini ierr = MatMultEqual(CU,C2,10,&flg);CHKERRQ(ierr); 121b84f494bSStefano Zampini if (!flg) { 122b84f494bSStefano Zampini ierr = PetscPrintf(PETSC_COMM_WORLD,"Error UNKNOWN_NONZERO_PATTERN (supposedly SUBSET_NONZERO_PATTERN)\n");CHKERRQ(ierr); 123b84f494bSStefano Zampini ierr = MatViewFromOptions(CU,NULL,"-view");CHKERRQ(ierr); 124b84f494bSStefano Zampini } 125b84f494bSStefano Zampini ierr = MatDestroy(&CU);CHKERRQ(ierr); 126c4762a1bSJed Brown 127c4762a1bSJed Brown ierr = MatDestroy(&C1);CHKERRQ(ierr); 128c4762a1bSJed Brown ierr = MatDestroy(&C2);CHKERRQ(ierr); 129c4762a1bSJed Brown ierr = MatDestroy(&C);CHKERRQ(ierr); 130c4762a1bSJed Brown 131c4762a1bSJed Brown ierr = PetscFinalize(); 132c4762a1bSJed Brown return ierr; 133c4762a1bSJed Brown } 134c4762a1bSJed Brown 135c4762a1bSJed Brown /*TEST 136c4762a1bSJed Brown 137c4762a1bSJed Brown test: 138039c6fbaSStefano Zampini suffix: 1 139039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 140039c6fbaSStefano Zampini args: -view 141039c6fbaSStefano Zampini diff_args: -j 142039c6fbaSStefano Zampini 143039c6fbaSStefano Zampini test: 144039c6fbaSStefano Zampini output_file: output/ex132_1.out 145039c6fbaSStefano Zampini requires: cuda 146039c6fbaSStefano Zampini suffix: 1_cuda 147039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 148039c6fbaSStefano Zampini args: -view -mat_type aijcusparse 149039c6fbaSStefano Zampini diff_args: -j 150039c6fbaSStefano Zampini 151039c6fbaSStefano Zampini test: 152039c6fbaSStefano Zampini output_file: output/ex132_1.out 153039c6fbaSStefano Zampini requires: kokkos_kernels 154039c6fbaSStefano Zampini suffix: 1_kokkos 155039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 156039c6fbaSStefano Zampini args: -view -mat_type aijkokkos 157039c6fbaSStefano Zampini diff_args: -j 158039c6fbaSStefano Zampini 159039c6fbaSStefano Zampini test: 160039c6fbaSStefano Zampini suffix: 2 161039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 162039c6fbaSStefano Zampini args: -view -mat_nonsym 163039c6fbaSStefano Zampini diff_args: -j 164039c6fbaSStefano Zampini 165039c6fbaSStefano Zampini test: 166039c6fbaSStefano Zampini output_file: output/ex132_2.out 167039c6fbaSStefano Zampini requires: cuda 168039c6fbaSStefano Zampini suffix: 2_cuda 169039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 170039c6fbaSStefano Zampini args: -view -mat_type aijcusparse -mat_nonsym 171039c6fbaSStefano Zampini diff_args: -j 172039c6fbaSStefano Zampini 173039c6fbaSStefano Zampini test: 174039c6fbaSStefano Zampini output_file: output/ex132_2.out 175039c6fbaSStefano Zampini requires: kokkos_kernels 176039c6fbaSStefano Zampini suffix: 2_kokkos 177039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 178039c6fbaSStefano Zampini args: -view -mat_type aijkokkos -mat_nonsym 179039c6fbaSStefano Zampini diff_args: -j 180039c6fbaSStefano Zampini 181039c6fbaSStefano Zampini test: 182039c6fbaSStefano Zampini nsize: 2 183039c6fbaSStefano Zampini suffix: 1_par 184039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 185039c6fbaSStefano Zampini args: -view 186039c6fbaSStefano Zampini diff_args: -j 187039c6fbaSStefano Zampini 188039c6fbaSStefano Zampini test: 189039c6fbaSStefano Zampini nsize: 2 190039c6fbaSStefano Zampini output_file: output/ex132_1_par.out 191039c6fbaSStefano Zampini requires: cuda 192039c6fbaSStefano Zampini suffix: 1_par_cuda 193039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 194039c6fbaSStefano Zampini args: -view -mat_type aijcusparse 195039c6fbaSStefano Zampini diff_args: -j 196039c6fbaSStefano Zampini 197039c6fbaSStefano Zampini test: 198039c6fbaSStefano Zampini nsize: 2 199039c6fbaSStefano Zampini output_file: output/ex132_1_par.out 200*3078479eSJunchao Zhang requires: !sycl kokkos_kernels 201039c6fbaSStefano Zampini suffix: 1_par_kokkos 202039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 203039c6fbaSStefano Zampini args: -view -mat_type aijkokkos 204039c6fbaSStefano Zampini diff_args: -j 205039c6fbaSStefano Zampini 206039c6fbaSStefano Zampini test: 207039c6fbaSStefano Zampini nsize: 2 208039c6fbaSStefano Zampini suffix: 2_par 209039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 210039c6fbaSStefano Zampini args: -view -mat_nonsym 211039c6fbaSStefano Zampini diff_args: -j 212039c6fbaSStefano Zampini 213039c6fbaSStefano Zampini test: 214039c6fbaSStefano Zampini nsize: 2 215039c6fbaSStefano Zampini output_file: output/ex132_2_par.out 216039c6fbaSStefano Zampini requires: cuda 217039c6fbaSStefano Zampini suffix: 2_par_cuda 218039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 219039c6fbaSStefano Zampini args: -view -mat_type aijcusparse -mat_nonsym 220039c6fbaSStefano Zampini diff_args: -j 221039c6fbaSStefano Zampini 222039c6fbaSStefano Zampini test: 223039c6fbaSStefano Zampini nsize: 2 224039c6fbaSStefano Zampini output_file: output/ex132_2_par.out 225*3078479eSJunchao Zhang requires: !sycl kokkos_kernels 226039c6fbaSStefano Zampini suffix: 2_par_kokkos 227039c6fbaSStefano Zampini filter: grep -v " type:" | grep -v "Mat Object" 22883567821SJunchao Zhang args: -view -mat_type aijkokkos -mat_nonsym -use_gpu_aware_mpi {{0 1}} 229039c6fbaSStefano Zampini diff_args: -j 230c4762a1bSJed Brown 231c4762a1bSJed Brown TEST*/ 232