1*076ba34aSJunchao Zhang static char help[] = "Test Mat products \n\n"; 2*076ba34aSJunchao Zhang 3*076ba34aSJunchao Zhang #include <petscmat.h> 4*076ba34aSJunchao Zhang int main(int argc,char **args) 5*076ba34aSJunchao Zhang { 6*076ba34aSJunchao Zhang Mat A=NULL,B=NULL,C=NULL,D=NULL,E=NULL; 7*076ba34aSJunchao Zhang PetscErrorCode ierr; 8*076ba34aSJunchao Zhang PetscInt k; 9*076ba34aSJunchao Zhang const PetscInt M = 18,N = 18; 10*076ba34aSJunchao Zhang PetscMPIInt rank; 11*076ba34aSJunchao Zhang 12*076ba34aSJunchao Zhang /* A, B are 18 x 18 nonsymmetric matrices and have the same sparsity pattern but different values. 13*076ba34aSJunchao Zhang Big enough to have complex communication patterns but still small enough for debugging. 14*076ba34aSJunchao Zhang */ 15*076ba34aSJunchao Zhang PetscInt Ai[] = {0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 5, 6, 6, 7, 7, 8, 8, 9, 9, 10, 10, 11, 11, 12, 12, 13, 13, 13, 14, 14, 15, 15, 16, 16, 17, 17}; 16*076ba34aSJunchao Zhang PetscInt Aj[] = {0, 1, 2, 7, 3, 8, 4, 9, 5, 8, 2, 6, 11, 0, 7, 1, 6, 2, 4, 10, 16, 11, 15, 12, 17, 12, 13, 14, 15, 17, 11, 13, 3, 16, 9, 15, 11, 13}; 17*076ba34aSJunchao Zhang PetscInt Bi[] = {0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 5, 6, 6, 7, 7, 8, 8, 9, 9, 10, 10, 11, 11, 12, 12, 13, 13, 13, 14, 14, 15, 15, 16, 16, 17, 17}; 18*076ba34aSJunchao Zhang PetscInt Bj[] = {0, 1, 2, 7, 3, 8, 4, 9, 5, 8, 2, 6, 11, 0, 7, 1, 6, 2, 4, 10, 16, 11, 15, 12, 17, 12, 13, 14, 15, 17, 11, 13, 3, 16, 9, 15, 11, 13}; 19*076ba34aSJunchao Zhang 20*076ba34aSJunchao Zhang PetscInt Annz = sizeof(Ai)/sizeof(PetscInt); 21*076ba34aSJunchao Zhang PetscInt Bnnz = sizeof(Bi)/sizeof(PetscInt); 22*076ba34aSJunchao Zhang 23*076ba34aSJunchao Zhang ierr = PetscInitialize(&argc,&args,(char*)0,help);if (ierr) return ierr; 24*076ba34aSJunchao Zhang ierr = MPI_Comm_rank(PETSC_COMM_WORLD,&rank);CHKERRMPI(ierr); 25*076ba34aSJunchao Zhang 26*076ba34aSJunchao Zhang ierr = MatCreate(PETSC_COMM_WORLD,&A);CHKERRQ(ierr); 27*076ba34aSJunchao Zhang ierr = MatSetSizes(A,PETSC_DECIDE,PETSC_DECIDE,M,N); 28*076ba34aSJunchao Zhang ierr = MatSetFromOptions(A);CHKERRQ(ierr); 29*076ba34aSJunchao Zhang ierr = MatSeqAIJSetPreallocation(A,2,NULL); 30*076ba34aSJunchao Zhang ierr = MatMPIAIJSetPreallocation(A,2,NULL,2,NULL);CHKERRQ(ierr); 31*076ba34aSJunchao Zhang ierr = MatSetOption(A,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 32*076ba34aSJunchao Zhang 33*076ba34aSJunchao Zhang if (rank == 0) { 34*076ba34aSJunchao Zhang for (k=0; k<Annz; k++) {ierr = MatSetValue(A,Ai[k],Aj[k],Ai[k]+Aj[k]+1.0,INSERT_VALUES);CHKERRQ(ierr);} 35*076ba34aSJunchao Zhang } 36*076ba34aSJunchao Zhang 37*076ba34aSJunchao Zhang ierr = MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 38*076ba34aSJunchao Zhang ierr = MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 39*076ba34aSJunchao Zhang 40*076ba34aSJunchao Zhang ierr = MatCreate(PETSC_COMM_WORLD,&B);CHKERRQ(ierr); 41*076ba34aSJunchao Zhang ierr = MatSetSizes(B,PETSC_DECIDE,PETSC_DECIDE,M,N); 42*076ba34aSJunchao Zhang ierr = MatSetFromOptions(B);CHKERRQ(ierr); 43*076ba34aSJunchao Zhang ierr = MatSeqAIJSetPreallocation(B,2,NULL); 44*076ba34aSJunchao Zhang ierr = MatMPIAIJSetPreallocation(B,2,NULL,2,NULL);CHKERRQ(ierr); 45*076ba34aSJunchao Zhang ierr = MatSetOption(B,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 46*076ba34aSJunchao Zhang 47*076ba34aSJunchao Zhang if (rank == 0) { 48*076ba34aSJunchao Zhang for (k=0; k<Bnnz; k++) {ierr = MatSetValue(B,Bi[k],Bj[k],Bi[k]+Bj[k]+2.0,INSERT_VALUES);CHKERRQ(ierr);} 49*076ba34aSJunchao Zhang } 50*076ba34aSJunchao Zhang ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 51*076ba34aSJunchao Zhang ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 52*076ba34aSJunchao Zhang 53*076ba34aSJunchao Zhang ierr = MatMatMult(A,B,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&C);CHKERRQ(ierr); 54*076ba34aSJunchao Zhang ierr = MatView(C,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 55*076ba34aSJunchao Zhang 56*076ba34aSJunchao Zhang /* B, A have the same nonzero pattern, so it is legitimate to do so */ 57*076ba34aSJunchao Zhang ierr = MatMatMult(B,A,MAT_REUSE_MATRIX,PETSC_DEFAULT,&C);CHKERRQ(ierr); 58*076ba34aSJunchao Zhang ierr = MatView(C,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 59*076ba34aSJunchao Zhang 60*076ba34aSJunchao Zhang ierr = MatTransposeMatMult(A,B,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&D);CHKERRQ(ierr); 61*076ba34aSJunchao Zhang ierr = MatView(D, PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 62*076ba34aSJunchao Zhang 63*076ba34aSJunchao Zhang ierr = MatPtAP(A,B,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&E);CHKERRQ(ierr); 64*076ba34aSJunchao Zhang ierr = MatView(E,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 65*076ba34aSJunchao Zhang 66*076ba34aSJunchao Zhang ierr = MatDestroy(&A);CHKERRQ(ierr); 67*076ba34aSJunchao Zhang ierr = MatDestroy(&B);CHKERRQ(ierr); 68*076ba34aSJunchao Zhang ierr = MatDestroy(&C);CHKERRQ(ierr); 69*076ba34aSJunchao Zhang ierr = MatDestroy(&D);CHKERRQ(ierr); 70*076ba34aSJunchao Zhang ierr = MatDestroy(&E);CHKERRQ(ierr); 71*076ba34aSJunchao Zhang 72*076ba34aSJunchao Zhang ierr = PetscFinalize(); 73*076ba34aSJunchao Zhang return ierr; 74*076ba34aSJunchao Zhang } 75*076ba34aSJunchao Zhang 76*076ba34aSJunchao Zhang /*TEST 77*076ba34aSJunchao Zhang testset: 78*076ba34aSJunchao Zhang filter: grep -ve type -ve "Mat Object" 79*076ba34aSJunchao Zhang output_file: output/ex250_1.out 80*076ba34aSJunchao Zhang 81*076ba34aSJunchao Zhang test: 82*076ba34aSJunchao Zhang suffix: 1 83*076ba34aSJunchao Zhang nsize: {{1 3}} 84*076ba34aSJunchao Zhang args: -mat_type aij 85*076ba34aSJunchao Zhang 86*076ba34aSJunchao Zhang test: 87*076ba34aSJunchao Zhang suffix: 2 88*076ba34aSJunchao Zhang nsize: {{3 4}} 89*076ba34aSJunchao Zhang args: -mat_type aij -matmatmult_via backend -matptap_via backend -mattransposematmult_via backend 90*076ba34aSJunchao Zhang 91*076ba34aSJunchao Zhang test: 92*076ba34aSJunchao Zhang suffix: cuda 93*076ba34aSJunchao Zhang requires: cuda 94*076ba34aSJunchao Zhang nsize: {{1 3 4}} 95*076ba34aSJunchao Zhang args: -mat_type aijcusparse 96*076ba34aSJunchao Zhang 97*076ba34aSJunchao Zhang test: 98*076ba34aSJunchao Zhang suffix: kok 99*076ba34aSJunchao Zhang requires: kokkos_kernels 100*076ba34aSJunchao Zhang nsize: {{1 3 4}} 101*076ba34aSJunchao Zhang args: -mat_type aijkokkos 102*076ba34aSJunchao Zhang 103*076ba34aSJunchao Zhang TEST*/ 104*076ba34aSJunchao Zhang 105