xref: /petsc/src/mat/tests/ex301.c (revision 327415f76d85372a4417cf1aaa14db707d4d6c04)
1c4762a1bSJed Brown 
/* Help text handed to PetscInitialize() in main(); it is never modified, hence const. */
static const char help[] = "Tests for bugs in A->offloadmask consistency for GPU matrices\n\n";
3c4762a1bSJed Brown 
4c4762a1bSJed Brown #include <petscmat.h>
5c4762a1bSJed Brown 
6c4762a1bSJed Brown int main(int argc,char **args)
7c4762a1bSJed Brown {
8c4762a1bSJed Brown   Mat            A;
9c4762a1bSJed Brown   PetscInt       i,j,rstart,rend,m = 3;
10c4762a1bSJed Brown   PetscScalar    one = 1.0,zero = 0.0,negativeone = -1.0;
11c4762a1bSJed Brown   PetscReal      norm;
12c4762a1bSJed Brown   Vec            x,y;
13c4762a1bSJed Brown 
14*327415f7SBarry Smith   PetscFunctionBeginUser;
159566063dSJacob Faibussowitsch   PetscCall(PetscInitialize(&argc,&args,(char*)0,help));
169566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetInt(NULL,NULL,"-m",&m,NULL));
17c4762a1bSJed Brown 
18c4762a1bSJed Brown   for (i=0; i<2; i++) {
19c4762a1bSJed Brown     /* Create the matrix and set it to contain explicit zero entries on the diagonal. */
209566063dSJacob Faibussowitsch     PetscCall(MatCreate(PETSC_COMM_WORLD,&A));
219566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(A,PETSC_DECIDE,PETSC_DECIDE,m*m,m*m));
229566063dSJacob Faibussowitsch     PetscCall(MatSetFromOptions(A));
239566063dSJacob Faibussowitsch     PetscCall(MatSetUp(A));
249566063dSJacob Faibussowitsch     PetscCall(MatGetOwnershipRange(A,&rstart,&rend));
259566063dSJacob Faibussowitsch     PetscCall(MatCreateVecs(A,&x,&y));
269566063dSJacob Faibussowitsch     PetscCall(VecSet(x,one));
279566063dSJacob Faibussowitsch     PetscCall(VecSet(y,zero));
289566063dSJacob Faibussowitsch     PetscCall(MatDiagonalSet(A,y,INSERT_VALUES));
29c4762a1bSJed Brown 
30c4762a1bSJed Brown     /* Now set A to be the identity using various approaches.
31c4762a1bSJed Brown      * Note that there may be other approaches that should be added here. */
32c4762a1bSJed Brown     switch (i) {
33c4762a1bSJed Brown     case 0:
349566063dSJacob Faibussowitsch       PetscCall(MatDiagonalSet(A,x,INSERT_VALUES));
35c4762a1bSJed Brown       break;
36c4762a1bSJed Brown     case 1:
37c4762a1bSJed Brown       for (j=rstart; j<rend; j++) {
389566063dSJacob Faibussowitsch         PetscCall(MatSetValue(A,j,j,one,INSERT_VALUES));
39c4762a1bSJed Brown       }
409566063dSJacob Faibussowitsch       PetscCall(MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY));
419566063dSJacob Faibussowitsch       PetscCall(MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY));
42c4762a1bSJed Brown       break;
43c4762a1bSJed Brown     case 2:
44c4762a1bSJed Brown       for (j=rstart; j<rend; j++) {
459566063dSJacob Faibussowitsch         PetscCall(MatSetValuesRow(A,j,&one));
46c4762a1bSJed Brown       }
479566063dSJacob Faibussowitsch       PetscCall(MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY));
489566063dSJacob Faibussowitsch       PetscCall(MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY));
49c4762a1bSJed Brown     default:
50c4762a1bSJed Brown       break;
51c4762a1bSJed Brown     }
52c4762a1bSJed Brown 
53c4762a1bSJed Brown     /* Compute y <- A*x and verify that the difference between y and x is negligible, as it should be since A is the identity. */
549566063dSJacob Faibussowitsch     PetscCall(MatMult(A,x,y));
559566063dSJacob Faibussowitsch     PetscCall(VecAXPY(y,negativeone,x));
569566063dSJacob Faibussowitsch     PetscCall(VecNorm(y,NORM_2,&norm));
57c4762a1bSJed Brown     if (norm > PETSC_SQRT_MACHINE_EPSILON) {
589566063dSJacob Faibussowitsch       PetscCall(PetscPrintf(PETSC_COMM_WORLD,"Test %" PetscInt_FMT ": Norm of error is %g, but should be near 0.\n",i,(double)norm));
59c4762a1bSJed Brown     }
60c4762a1bSJed Brown 
619566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&A));
629566063dSJacob Faibussowitsch     PetscCall(VecDestroy(&x));
639566063dSJacob Faibussowitsch     PetscCall(VecDestroy(&y));
64c4762a1bSJed Brown   }
65c4762a1bSJed Brown 
669566063dSJacob Faibussowitsch   PetscCall(PetscFinalize());
67b122ec5aSJacob Faibussowitsch   return 0;
68c4762a1bSJed Brown }
69c4762a1bSJed Brown 
/*TEST

   test:
      suffix: aijviennacl_1
      nsize: 1
      args: -mat_type aijviennacl
      requires: viennacl

   test:
      suffix: aijviennacl_2
      nsize: 2
      args: -mat_type aijviennacl
      requires: viennacl

   test:
      suffix: aijcusparse_1
      nsize: 1
      args: -mat_type aijcusparse
      requires: cuda

   test:
      suffix: aijcusparse_2
      nsize: 2
      args: -mat_type aijcusparse
      requires: cuda
TEST*/
96