1*c4762a1bSJed Brown 2*c4762a1bSJed Brown static char help[] = "Tests MatTranspose(), MatNorm(), MatAXPY() and MatAYPX().\n\n"; 3*c4762a1bSJed Brown 4*c4762a1bSJed Brown #include <petscmat.h> 5*c4762a1bSJed Brown 6*c4762a1bSJed Brown static PetscErrorCode TransposeAXPY(Mat C,PetscScalar alpha,Mat mat,PetscErrorCode (*f)(Mat,Mat*)) 7*c4762a1bSJed Brown { 8*c4762a1bSJed Brown Mat D,E,F,G; 9*c4762a1bSJed Brown PetscErrorCode ierr; 10*c4762a1bSJed Brown 11*c4762a1bSJed Brown PetscFunctionBegin; 12*c4762a1bSJed Brown if (f == MatCreateTranspose) { 13*c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD,"MatAXPY: (C^T)^T = (C^T)^T + alpha * A, C=A, SAME_NONZERO_PATTERN\n");CHKERRQ(ierr); 14*c4762a1bSJed Brown } else { 15*c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD,"MatAXPY: (C^H)^H = (C^H)^H + alpha * A, C=A, SAME_NONZERO_PATTERN\n");CHKERRQ(ierr); 16*c4762a1bSJed Brown } 17*c4762a1bSJed Brown ierr = MatDuplicate(mat,MAT_COPY_VALUES,&C);CHKERRQ(ierr); 18*c4762a1bSJed Brown ierr = f(C,&D);CHKERRQ(ierr); 19*c4762a1bSJed Brown ierr = f(D,&E);CHKERRQ(ierr); 20*c4762a1bSJed Brown ierr = MatAXPY(E,alpha,mat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 21*c4762a1bSJed Brown ierr = MatView(C,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 22*c4762a1bSJed Brown ierr = MatDestroy(&E);CHKERRQ(ierr); 23*c4762a1bSJed Brown ierr = MatDestroy(&D);CHKERRQ(ierr); 24*c4762a1bSJed Brown ierr = MatDestroy(&C);CHKERRQ(ierr); 25*c4762a1bSJed Brown if (f == MatCreateTranspose) { 26*c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD,"MatAXPY: C = C + alpha * (A^T)^T, C=A, SAME_NONZERO_PATTERN\n");CHKERRQ(ierr); 27*c4762a1bSJed Brown } else { 28*c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD,"MatAXPY: C = C + alpha * (A^H)^H, C=A, SAME_NONZERO_PATTERN\n");CHKERRQ(ierr); 29*c4762a1bSJed Brown } 30*c4762a1bSJed Brown ierr = MatDuplicate(mat,MAT_COPY_VALUES,&C);CHKERRQ(ierr); 31*c4762a1bSJed Brown /* MATTRANSPOSE should have a MatTranspose_Transpose or MatTranspose_HT implementation */ 32*c4762a1bSJed Brown if (f == MatCreateTranspose) { 33*c4762a1bSJed Brown ierr = MatTranspose(mat,MAT_INITIAL_MATRIX,&D);CHKERRQ(ierr); 34*c4762a1bSJed Brown } else { 35*c4762a1bSJed Brown ierr = MatHermitianTranspose(mat,MAT_INITIAL_MATRIX,&D);CHKERRQ(ierr); 36*c4762a1bSJed Brown } 37*c4762a1bSJed Brown ierr = f(D,&E);CHKERRQ(ierr); 38*c4762a1bSJed Brown ierr = MatAXPY(C,alpha,E,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 39*c4762a1bSJed Brown ierr = MatView(C,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 40*c4762a1bSJed Brown ierr = MatDestroy(&E);CHKERRQ(ierr); 41*c4762a1bSJed Brown ierr = MatDestroy(&D);CHKERRQ(ierr); 42*c4762a1bSJed Brown ierr = MatDestroy(&C);CHKERRQ(ierr); 43*c4762a1bSJed Brown if (f == MatCreateTranspose) { 44*c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD,"MatAXPY: (C^T)^T = (C^T)^T + alpha * (A^T)^T, C=A, SAME_NONZERO_PATTERN\n");CHKERRQ(ierr); 45*c4762a1bSJed Brown } else { 46*c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD,"MatAXPY: (C^H)^H = (C^H)^H + alpha * (A^H)^H, C=A, SAME_NONZERO_PATTERN\n");CHKERRQ(ierr); 47*c4762a1bSJed Brown } 48*c4762a1bSJed Brown ierr = MatDuplicate(mat,MAT_COPY_VALUES,&C);CHKERRQ(ierr); 49*c4762a1bSJed Brown ierr = f(C,&D);CHKERRQ(ierr); 50*c4762a1bSJed Brown ierr = f(D,&E);CHKERRQ(ierr); 51*c4762a1bSJed Brown ierr = f(mat,&F);CHKERRQ(ierr); 52*c4762a1bSJed Brown ierr = f(F,&G);CHKERRQ(ierr); 53*c4762a1bSJed Brown ierr = MatAXPY(E,alpha,G,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 54*c4762a1bSJed Brown ierr = MatView(C,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 55*c4762a1bSJed Brown ierr = MatDestroy(&G);CHKERRQ(ierr); 56*c4762a1bSJed Brown ierr = MatDestroy(&F);CHKERRQ(ierr); 57*c4762a1bSJed Brown ierr = MatDestroy(&E);CHKERRQ(ierr); 58*c4762a1bSJed Brown ierr = MatDestroy(&D);CHKERRQ(ierr); 59*c4762a1bSJed Brown ierr = MatDestroy(&C);CHKERRQ(ierr); 60*c4762a1bSJed Brown PetscFunctionReturn(0); 61*c4762a1bSJed Brown } 62*c4762a1bSJed Brown 63*c4762a1bSJed Brown int main(int argc,char **argv) 64*c4762a1bSJed Brown { 65*c4762a1bSJed Brown Mat mat,tmat = 0; 66*c4762a1bSJed Brown PetscInt m = 7,n,i,j,rstart,rend,rect = 0; 67*c4762a1bSJed Brown PetscErrorCode ierr; 68*c4762a1bSJed Brown PetscMPIInt size,rank; 69*c4762a1bSJed Brown PetscBool flg; 70*c4762a1bSJed Brown PetscScalar v, alpha; 71*c4762a1bSJed Brown PetscReal normf,normi,norm1; 72*c4762a1bSJed Brown 73*c4762a1bSJed Brown ierr = PetscInitialize(&argc,&argv,(char*)0,help);if (ierr) return ierr; 74*c4762a1bSJed Brown ierr = PetscViewerPushFormat(PETSC_VIEWER_STDOUT_WORLD,PETSC_VIEWER_ASCII_COMMON);CHKERRQ(ierr); 75*c4762a1bSJed Brown ierr = PetscOptionsGetInt(NULL,NULL,"-m",&m,NULL);CHKERRQ(ierr); 76*c4762a1bSJed Brown ierr = MPI_Comm_rank(PETSC_COMM_WORLD,&rank);CHKERRQ(ierr); 77*c4762a1bSJed Brown ierr = MPI_Comm_size(PETSC_COMM_WORLD,&size);CHKERRQ(ierr); 78*c4762a1bSJed Brown n = m; 79*c4762a1bSJed Brown ierr = PetscOptionsHasName(NULL,NULL,"-rectA",&flg);CHKERRQ(ierr); 80*c4762a1bSJed Brown if (flg) {n += 2; rect = 1;} 81*c4762a1bSJed Brown ierr = PetscOptionsHasName(NULL,NULL,"-rectB",&flg);CHKERRQ(ierr); 82*c4762a1bSJed Brown if (flg) {n -= 2; rect = 1;} 83*c4762a1bSJed Brown 84*c4762a1bSJed Brown /* ------- Assemble matrix, test MatValid() --------- */ 85*c4762a1bSJed Brown ierr = MatCreate(PETSC_COMM_WORLD,&mat);CHKERRQ(ierr); 86*c4762a1bSJed Brown ierr = MatSetSizes(mat,PETSC_DECIDE,PETSC_DECIDE,m,n);CHKERRQ(ierr); 87*c4762a1bSJed Brown ierr = MatSetFromOptions(mat);CHKERRQ(ierr); 88*c4762a1bSJed Brown ierr = MatSetUp(mat);CHKERRQ(ierr); 89*c4762a1bSJed Brown ierr = MatGetOwnershipRange(mat,&rstart,&rend);CHKERRQ(ierr); 90*c4762a1bSJed Brown for (i=rstart; i<rend; i++) { 91*c4762a1bSJed Brown for (j=0; j<n; j++) { 92*c4762a1bSJed Brown v = 10.0*i+j; 93*c4762a1bSJed Brown ierr = MatSetValues(mat,1,&i,1,&j,&v,INSERT_VALUES);CHKERRQ(ierr); 94*c4762a1bSJed Brown } 95*c4762a1bSJed Brown } 96*c4762a1bSJed Brown ierr = MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 97*c4762a1bSJed Brown ierr = MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 98*c4762a1bSJed Brown 99*c4762a1bSJed Brown /* ----------------- Test MatNorm() ----------------- */ 100*c4762a1bSJed Brown ierr = MatNorm(mat,NORM_FROBENIUS,&normf);CHKERRQ(ierr); 101*c4762a1bSJed Brown ierr = MatNorm(mat,NORM_1,&norm1);CHKERRQ(ierr); 102*c4762a1bSJed Brown ierr = MatNorm(mat,NORM_INFINITY,&normi);CHKERRQ(ierr); 103*c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD,"original A: Frobenious norm = %g, one norm = %g, infinity norm = %g\n",(double)normf,(double)norm1,(double)normi);CHKERRQ(ierr); 104*c4762a1bSJed Brown ierr = MatView(mat,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 105*c4762a1bSJed Brown 106*c4762a1bSJed Brown /* --------------- Test MatTranspose() -------------- */ 107*c4762a1bSJed Brown ierr = PetscOptionsHasName(NULL,NULL,"-in_place",&flg);CHKERRQ(ierr); 108*c4762a1bSJed Brown if (!rect && flg) { 109*c4762a1bSJed Brown ierr = MatTranspose(mat,MAT_REUSE_MATRIX,&mat);CHKERRQ(ierr); /* in-place transpose */ 110*c4762a1bSJed Brown tmat = mat; mat = 0; 111*c4762a1bSJed Brown } else { /* out-of-place transpose */ 112*c4762a1bSJed Brown ierr = MatTranspose(mat,MAT_INITIAL_MATRIX,&tmat);CHKERRQ(ierr); 113*c4762a1bSJed Brown } 114*c4762a1bSJed Brown 115*c4762a1bSJed Brown /* ----------------- Test MatNorm() ----------------- */ 116*c4762a1bSJed Brown /* Print info about transpose matrix */ 117*c4762a1bSJed Brown ierr = MatNorm(tmat,NORM_FROBENIUS,&normf);CHKERRQ(ierr); 118*c4762a1bSJed Brown ierr = MatNorm(tmat,NORM_1,&norm1);CHKERRQ(ierr); 119*c4762a1bSJed Brown ierr = MatNorm(tmat,NORM_INFINITY,&normi);CHKERRQ(ierr); 120*c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD,"B = A^T: Frobenious norm = %g, one norm = %g, infinity norm = %g\n",(double)normf,(double)norm1,(double)normi);CHKERRQ(ierr); 121*c4762a1bSJed Brown ierr = MatView(tmat,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 122*c4762a1bSJed Brown 123*c4762a1bSJed Brown /* ----------------- Test MatAXPY(), MatAYPX() ----------------- */ 124*c4762a1bSJed Brown if (mat && !rect) { 125*c4762a1bSJed Brown alpha = 1.0; 126*c4762a1bSJed Brown ierr = PetscOptionsGetScalar(NULL,NULL,"-alpha",&alpha,NULL);CHKERRQ(ierr); 127*c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD,"MatAXPY: B = B + alpha * A\n");CHKERRQ(ierr); 128*c4762a1bSJed Brown ierr = MatAXPY(tmat,alpha,mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 129*c4762a1bSJed Brown ierr = MatView(tmat,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 130*c4762a1bSJed Brown 131*c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD,"MatAYPX: B = alpha*B + A\n");CHKERRQ(ierr); 132*c4762a1bSJed Brown ierr = MatAYPX(tmat,alpha,mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 133*c4762a1bSJed Brown ierr = MatView(tmat,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 134*c4762a1bSJed Brown } 135*c4762a1bSJed Brown 136*c4762a1bSJed Brown { 137*c4762a1bSJed Brown Mat C; 138*c4762a1bSJed Brown alpha = 1.0; 139*c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD,"MatAXPY: C = C + alpha * A, C=A, SAME_NONZERO_PATTERN\n");CHKERRQ(ierr); 140*c4762a1bSJed Brown ierr = MatDuplicate(mat,MAT_COPY_VALUES,&C);CHKERRQ(ierr); 141*c4762a1bSJed Brown ierr = MatAXPY(C,alpha,mat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 142*c4762a1bSJed Brown ierr = MatView(C,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 143*c4762a1bSJed Brown ierr = MatDestroy(&C);CHKERRQ(ierr); 144*c4762a1bSJed Brown ierr = TransposeAXPY(C,alpha,mat,MatCreateTranspose);CHKERRQ(ierr); 145*c4762a1bSJed Brown ierr = TransposeAXPY(C,alpha,mat,MatCreateHermitianTranspose);CHKERRQ(ierr); 146*c4762a1bSJed Brown } 147*c4762a1bSJed Brown 148*c4762a1bSJed Brown { 149*c4762a1bSJed Brown Mat matB; 150*c4762a1bSJed Brown /* get matB that has nonzeros of mat in all even numbers of row and col */ 151*c4762a1bSJed Brown ierr = MatCreate(PETSC_COMM_WORLD,&matB);CHKERRQ(ierr); 152*c4762a1bSJed Brown ierr = MatSetSizes(matB,PETSC_DECIDE,PETSC_DECIDE,m,n);CHKERRQ(ierr); 153*c4762a1bSJed Brown ierr = MatSetFromOptions(matB);CHKERRQ(ierr); 154*c4762a1bSJed Brown ierr = MatSetUp(matB);CHKERRQ(ierr); 155*c4762a1bSJed Brown ierr = MatGetOwnershipRange(matB,&rstart,&rend);CHKERRQ(ierr); 156*c4762a1bSJed Brown if (rstart % 2 != 0) rstart++; 157*c4762a1bSJed Brown for (i=rstart; i<rend; i += 2) { 158*c4762a1bSJed Brown for (j=0; j<n; j += 2) { 159*c4762a1bSJed Brown v = 10.0*i+j; 160*c4762a1bSJed Brown ierr = MatSetValues(matB,1,&i,1,&j,&v,INSERT_VALUES);CHKERRQ(ierr); 161*c4762a1bSJed Brown } 162*c4762a1bSJed Brown } 163*c4762a1bSJed Brown ierr = MatAssemblyBegin(matB,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 164*c4762a1bSJed Brown ierr = MatAssemblyEnd(matB,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 165*c4762a1bSJed Brown PetscPrintf(PETSC_COMM_WORLD," A: original matrix:\n"); 166*c4762a1bSJed Brown ierr = MatView(mat,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 167*c4762a1bSJed Brown PetscPrintf(PETSC_COMM_WORLD," B(a subset of A):\n"); 168*c4762a1bSJed Brown ierr = MatView(matB,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 169*c4762a1bSJed Brown ierr = PetscPrintf(PETSC_COMM_WORLD,"MatAXPY: B = B + alpha * A, SUBSET_NONZERO_PATTERN\n");CHKERRQ(ierr); 170*c4762a1bSJed Brown ierr = MatAXPY(mat,alpha,matB,SUBSET_NONZERO_PATTERN);CHKERRQ(ierr); 171*c4762a1bSJed Brown ierr = MatView(mat,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 172*c4762a1bSJed Brown ierr = MatDestroy(&matB);CHKERRQ(ierr); 173*c4762a1bSJed Brown } 174*c4762a1bSJed Brown 175*c4762a1bSJed Brown ierr = PetscViewerPopFormat(PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 176*c4762a1bSJed Brown /* Free data structures */ 177*c4762a1bSJed Brown ierr = MatDestroy(&mat);CHKERRQ(ierr); 178*c4762a1bSJed Brown ierr = MatDestroy(&tmat);CHKERRQ(ierr); 179*c4762a1bSJed Brown ierr = PetscFinalize(); 180*c4762a1bSJed Brown return ierr; 181*c4762a1bSJed Brown } 182*c4762a1bSJed Brown 183*c4762a1bSJed Brown 184*c4762a1bSJed Brown 185*c4762a1bSJed Brown 186*c4762a1bSJed Brown 187*c4762a1bSJed Brown /*TEST 188*c4762a1bSJed Brown 189*c4762a1bSJed Brown test: 190*c4762a1bSJed Brown suffix: 11_A 191*c4762a1bSJed Brown args: -mat_type seqaij -rectA 192*c4762a1bSJed Brown filter: grep -v "Mat Object" 193*c4762a1bSJed Brown 194*c4762a1bSJed Brown test: 195*c4762a1bSJed Brown suffix: 12_A 196*c4762a1bSJed Brown args: -mat_type seqdense -rectA 197*c4762a1bSJed Brown filter: grep -v "Mat Object" 198*c4762a1bSJed Brown 199*c4762a1bSJed Brown test: 200*c4762a1bSJed Brown suffix: 11_B 201*c4762a1bSJed Brown args: -mat_type seqaij -rectB 202*c4762a1bSJed Brown filter: grep -v "Mat Object" 203*c4762a1bSJed Brown 204*c4762a1bSJed Brown test: 205*c4762a1bSJed Brown suffix: 12_B 206*c4762a1bSJed Brown args: -mat_type seqdense -rectB 207*c4762a1bSJed Brown filter: grep -v "Mat Object" 208*c4762a1bSJed Brown 209*c4762a1bSJed Brown test: 210*c4762a1bSJed Brown suffix: 21 211*c4762a1bSJed Brown args: -mat_type mpiaij 212*c4762a1bSJed Brown 213*c4762a1bSJed Brown test: 214*c4762a1bSJed Brown suffix: 22 215*c4762a1bSJed Brown args: -mat_type mpidense 216*c4762a1bSJed Brown 217*c4762a1bSJed Brown test: 218*c4762a1bSJed Brown suffix: 23 219*c4762a1bSJed Brown nsize: 3 220*c4762a1bSJed Brown args: -mat_type mpiaij 221*c4762a1bSJed Brown filter: grep -v type | grep -v "MPI processes" 222*c4762a1bSJed Brown 223*c4762a1bSJed Brown test: 224*c4762a1bSJed Brown suffix: 24 225*c4762a1bSJed Brown nsize: 3 226*c4762a1bSJed Brown args: -mat_type mpidense 227*c4762a1bSJed Brown 228*c4762a1bSJed Brown test: 229*c4762a1bSJed Brown suffix: 2_aijcusparse_1 230*c4762a1bSJed Brown args: -mat_type mpiaijcusparse 231*c4762a1bSJed Brown output_file: output/ex2_23.out 232*c4762a1bSJed Brown requires: cuda 233*c4762a1bSJed Brown filter: grep -v type | grep -v "MPI processes" 234*c4762a1bSJed Brown 235*c4762a1bSJed Brown test: 236*c4762a1bSJed Brown suffix: 2_aijcusparse_2 237*c4762a1bSJed Brown nsize: 3 238*c4762a1bSJed Brown args: -mat_type mpiaijcusparse 239*c4762a1bSJed Brown output_file: output/ex2_23.out 240*c4762a1bSJed Brown requires: cuda 241*c4762a1bSJed Brown filter: grep -v type | grep -v "MPI processes" 242*c4762a1bSJed Brown 243*c4762a1bSJed Brown test: 244*c4762a1bSJed Brown suffix: 3 245*c4762a1bSJed Brown nsize: 2 246*c4762a1bSJed Brown args: -mat_type mpiaij -rectA 247*c4762a1bSJed Brown 248*c4762a1bSJed Brown test: 249*c4762a1bSJed Brown suffix: 3_aijcusparse 250*c4762a1bSJed Brown nsize: 2 251*c4762a1bSJed Brown args: -mat_type mpiaijcusparse -rectA 252*c4762a1bSJed Brown requires: cuda 253*c4762a1bSJed Brown 254*c4762a1bSJed Brown test: 255*c4762a1bSJed Brown suffix: 4 256*c4762a1bSJed Brown nsize: 2 257*c4762a1bSJed Brown args: -mat_type mpidense -rectA 258*c4762a1bSJed Brown 259*c4762a1bSJed Brown test: 260*c4762a1bSJed Brown suffix: aijcusparse_1 261*c4762a1bSJed Brown args: -mat_type seqaijcusparse -rectA 262*c4762a1bSJed Brown filter: grep -v "Mat Object" 263*c4762a1bSJed Brown output_file: output/ex2_11_A_aijcusparse.out 264*c4762a1bSJed Brown requires: cuda 265*c4762a1bSJed Brown 266*c4762a1bSJed Brown test: 267*c4762a1bSJed Brown suffix: aijcusparse_2 268*c4762a1bSJed Brown args: -mat_type seqaijcusparse -rectB 269*c4762a1bSJed Brown filter: grep -v "Mat Object" 270*c4762a1bSJed Brown output_file: output/ex2_11_B_aijcusparse.out 271*c4762a1bSJed Brown requires: cuda 272*c4762a1bSJed Brown 273*c4762a1bSJed Brown TEST*/ 274