16f79c3a4SBarry Smith 2af0996ceSBarry Smith #include <petsc/private/matimpl.h> /*I "petscmat.h" I*/ 36f79c3a4SBarry Smith 406be10caSBarry Smith /*@ 521c89e3eSBarry Smith MatAXPY - Computes Y = a*X + Y. 66f79c3a4SBarry Smith 73f9fe445SBarry Smith Logically Collective on Mat 8fee21e36SBarry Smith 998a79cdbSBarry Smith Input Parameters: 10607cd303SBarry Smith + a - the scalar multiplier 11607cd303SBarry Smith . X - the first matrix 12607cd303SBarry Smith . Y - the second matrix 13407f6b05SHong Zhang - str - either SAME_NONZERO_PATTERN, DIFFERENT_NONZERO_PATTERN 14407f6b05SHong Zhang or SUBSET_NONZERO_PATTERN (nonzeros of X is a subset of Y's) 1598a79cdbSBarry Smith 162860a424SLois Curfman McInnes Level: intermediate 172860a424SLois Curfman McInnes 189cf4f1e8SLois Curfman McInnes .keywords: matrix, add 19d4bb536fSBarry Smith 202860a424SLois Curfman McInnes .seealso: MatAYPX() 2106be10caSBarry Smith @*/ 227087cfbeSBarry Smith PetscErrorCode MatAXPY(Mat Y,PetscScalar a,Mat X,MatStructure str) 236f79c3a4SBarry Smith { 246849ba73SBarry Smith PetscErrorCode ierr; 25*646531bbSStefano Zampini PetscInt M1,M2,N1,N2; 26c1ac3661SBarry Smith PetscInt m1,m2,n1,n2; 270ff8bee4SStefano Zampini PetscBool sametype; 286f79c3a4SBarry Smith 293a40ed3dSBarry Smith PetscFunctionBegin; 300700a824SBarry Smith PetscValidHeaderSpecific(Y,MAT_CLASSID,1); 31c5eb9154SBarry Smith PetscValidLogicalCollectiveScalar(Y,a,2); 32*646531bbSStefano Zampini PetscValidHeaderSpecific(X,MAT_CLASSID,3); 33*646531bbSStefano Zampini PetscCheckSameComm(Y,1,X,3); 34*646531bbSStefano Zampini ierr = MatGetSize(X,&M1,&N1);CHKERRQ(ierr); 35*646531bbSStefano Zampini ierr = MatGetSize(Y,&M2,&N2);CHKERRQ(ierr); 36*646531bbSStefano Zampini ierr = MatGetLocalSize(X,&m1,&n1);CHKERRQ(ierr); 37*646531bbSStefano Zampini ierr = MatGetLocalSize(Y,&m2,&n2);CHKERRQ(ierr); 38*646531bbSStefano Zampini if (M1 != M2 || N1 != N2) SETERRQ4(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_SIZ,"Non conforming matrix add: global sizes %D x %D, %D x %D",M1,M2,N1,N2); 39*646531bbSStefano Zampini if (m1 != m2 || n1 != n2) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Non conforming matrix add: local sizes %D x %D, %D x %D",m1,m2,n1,n2); 401987afe7SBarry Smith 410ff8bee4SStefano Zampini ierr = PetscStrcmp(((PetscObject)X)->type_name,((PetscObject)Y)->type_name,&sametype);CHKERRQ(ierr); 42e8136da8SHong Zhang ierr = PetscLogEventBegin(MAT_AXPY,Y,0,0,0);CHKERRQ(ierr); 430ff8bee4SStefano Zampini if (Y->ops->axpy && sametype) { 44f4df32b1SMatthew Knepley ierr = (*Y->ops->axpy)(Y,a,X,str);CHKERRQ(ierr); 45d4bb536fSBarry Smith } else { 46*646531bbSStefano Zampini if (str != DIFFERENT_NONZERO_PATTERN) { 47f4df32b1SMatthew Knepley ierr = MatAXPY_Basic(Y,a,X,str);CHKERRQ(ierr); 48*646531bbSStefano Zampini } else { 49*646531bbSStefano Zampini Mat B; 50*646531bbSStefano Zampini 51*646531bbSStefano Zampini ierr = MatAXPY_Basic_Preallocate(Y,X,&B);CHKERRQ(ierr); 52*646531bbSStefano Zampini ierr = MatAXPY_BasicWithPreallocation(B,Y,a,X,str);CHKERRQ(ierr); 53*646531bbSStefano Zampini ierr = MatHeaderReplace(Y,&B);CHKERRQ(ierr); 54*646531bbSStefano Zampini } 55607cd303SBarry Smith } 56e8136da8SHong Zhang ierr = PetscLogEventEnd(MAT_AXPY,Y,0,0,0);CHKERRQ(ierr); 57fd314934SBarry Smith #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 58b8ced49eSKarl Rupp if (Y->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED) { 59b8ced49eSKarl Rupp Y->valid_GPU_matrix = PETSC_OFFLOAD_CPU; 60c41cb2e2SAlejandro Lamas Daviña } 61d67ff14aSKarl Rupp #endif 62607cd303SBarry Smith PetscFunctionReturn(0); 63607cd303SBarry Smith } 64607cd303SBarry Smith 65*646531bbSStefano Zampini PetscErrorCode MatAXPY_Basic_Preallocate(Mat Y, Mat X, Mat *B) 66*646531bbSStefano Zampini { 67*646531bbSStefano Zampini PetscErrorCode ierr; 68*646531bbSStefano Zampini 69*646531bbSStefano Zampini PetscFunctionBegin; 70*646531bbSStefano Zampini /* look for any available faster alternative to the general preallocator */ 71*646531bbSStefano Zampini PetscErrorCode (*preall)(Mat,Mat,Mat*) = NULL; 72*646531bbSStefano Zampini ierr = PetscObjectQueryFunction((PetscObject)Y,"MatAXPYGetPreallocation_C",&preall);CHKERRQ(ierr); 73*646531bbSStefano Zampini if (preall) { 74*646531bbSStefano Zampini ierr = (*preall)(Y,X,B);CHKERRQ(ierr); 75*646531bbSStefano Zampini } else { /* Use MatPrellocator, assumes same row-col distribution */ 76*646531bbSStefano Zampini Mat preallocator; 77*646531bbSStefano Zampini PetscInt r,rstart,rend; 78*646531bbSStefano Zampini PetscInt m,n,M,N; 79*646531bbSStefano Zampini 80*646531bbSStefano Zampini ierr = MatGetSize(Y,&M,&N);CHKERRQ(ierr); 81*646531bbSStefano Zampini ierr = MatGetLocalSize(Y,&m,&n);CHKERRQ(ierr); 82*646531bbSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)Y),&preallocator);CHKERRQ(ierr); 83*646531bbSStefano Zampini ierr = MatSetType(preallocator,MATPREALLOCATOR);CHKERRQ(ierr); 84*646531bbSStefano Zampini ierr = MatSetSizes(preallocator,m,n,M,N);CHKERRQ(ierr); 85*646531bbSStefano Zampini ierr = MatSetUp(preallocator);CHKERRQ(ierr); 86*646531bbSStefano Zampini ierr = MatGetOwnershipRange(preallocator,&rstart,&rend);CHKERRQ(ierr); 87*646531bbSStefano Zampini for (r = rstart; r < rend; ++r) { 88*646531bbSStefano Zampini PetscInt ncols; 89*646531bbSStefano Zampini const PetscInt *row; 90*646531bbSStefano Zampini const PetscScalar *vals; 91*646531bbSStefano Zampini 92*646531bbSStefano Zampini ierr = MatGetRow(Y,r,&ncols,&row,&vals);CHKERRQ(ierr); 93*646531bbSStefano Zampini ierr = MatSetValues(preallocator,1,&r,ncols,row,vals,INSERT_VALUES);CHKERRQ(ierr); 94*646531bbSStefano Zampini ierr = MatRestoreRow(Y,r,&ncols,&row,&vals);CHKERRQ(ierr); 95*646531bbSStefano Zampini ierr = MatGetRow(X,r,&ncols,&row,&vals);CHKERRQ(ierr); 96*646531bbSStefano Zampini ierr = MatSetValues(preallocator,1,&r,ncols,row,vals,INSERT_VALUES);CHKERRQ(ierr); 97*646531bbSStefano Zampini ierr = MatRestoreRow(X,r,&ncols,&row,&vals);CHKERRQ(ierr); 98*646531bbSStefano Zampini } 99*646531bbSStefano Zampini ierr = MatAssemblyBegin(preallocator,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 100*646531bbSStefano Zampini ierr = MatAssemblyEnd(preallocator,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 101*646531bbSStefano Zampini 102*646531bbSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)Y),B);CHKERRQ(ierr); 103*646531bbSStefano Zampini ierr = MatSetType(*B,((PetscObject)Y)->type_name);CHKERRQ(ierr); 104*646531bbSStefano Zampini ierr = MatSetSizes(*B,m,n,M,N);CHKERRQ(ierr); 105*646531bbSStefano Zampini ierr = MatPreallocatorPreallocate(preallocator,PETSC_FALSE,*B);CHKERRQ(ierr); 106*646531bbSStefano Zampini ierr = MatDestroy(&preallocator);CHKERRQ(ierr); 107*646531bbSStefano Zampini } 108*646531bbSStefano Zampini PetscFunctionReturn(0); 109*646531bbSStefano Zampini } 110*646531bbSStefano Zampini 111f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_Basic(Mat Y,PetscScalar a,Mat X,MatStructure str) 112607cd303SBarry Smith { 11338baddfdSBarry Smith PetscInt i,start,end,j,ncols,m,n; 1146849ba73SBarry Smith PetscErrorCode ierr; 11538baddfdSBarry Smith const PetscInt *row; 116b3cc6726SBarry Smith PetscScalar *val; 117b3cc6726SBarry Smith const PetscScalar *vals; 118607cd303SBarry Smith 119607cd303SBarry Smith PetscFunctionBegin; 1208dadbd76SSatish Balay ierr = MatGetSize(X,&m,&n);CHKERRQ(ierr); 12190f02eecSBarry Smith ierr = MatGetOwnershipRange(X,&start,&end);CHKERRQ(ierr); 122f4df32b1SMatthew Knepley if (a == 1.0) { 123d4bb536fSBarry Smith for (i = start; i < end; i++) { 124d4bb536fSBarry Smith ierr = MatGetRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 125d4bb536fSBarry Smith ierr = MatSetValues(Y,1,&i,ncols,row,vals,ADD_VALUES);CHKERRQ(ierr); 126d4bb536fSBarry Smith ierr = MatRestoreRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 127d4bb536fSBarry Smith } 128d4bb536fSBarry Smith } else { 129854ce69bSBarry Smith ierr = PetscMalloc1(n+1,&val);CHKERRQ(ierr); 13006be10caSBarry Smith for (i=start; i<end; i++) { 131b3cc6726SBarry Smith ierr = MatGetRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 13206be10caSBarry Smith for (j=0; j<ncols; j++) { 133f4df32b1SMatthew Knepley val[j] = a*vals[j]; 1346f79c3a4SBarry Smith } 135b3cc6726SBarry Smith ierr = MatSetValues(Y,1,&i,ncols,row,val,ADD_VALUES);CHKERRQ(ierr); 136b3cc6726SBarry Smith ierr = MatRestoreRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 1376f79c3a4SBarry Smith } 138b3cc6726SBarry Smith ierr = PetscFree(val);CHKERRQ(ierr); 139d4bb536fSBarry Smith } 1406d4a8577SBarry Smith ierr = MatAssemblyBegin(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1416d4a8577SBarry Smith ierr = MatAssemblyEnd(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1423a40ed3dSBarry Smith PetscFunctionReturn(0); 1436f79c3a4SBarry Smith } 144052efed2SBarry Smith 145ec7775f6SShri Abhyankar PetscErrorCode MatAXPY_BasicWithPreallocation(Mat B,Mat Y,PetscScalar a,Mat X,MatStructure str) 146ec7775f6SShri Abhyankar { 147ec7775f6SShri Abhyankar PetscInt i,start,end,j,ncols,m,n; 148ec7775f6SShri Abhyankar PetscErrorCode ierr; 149ec7775f6SShri Abhyankar const PetscInt *row; 150ec7775f6SShri Abhyankar PetscScalar *val; 151ec7775f6SShri Abhyankar const PetscScalar *vals; 152ec7775f6SShri Abhyankar 153ec7775f6SShri Abhyankar PetscFunctionBegin; 154ec7775f6SShri Abhyankar ierr = MatGetSize(X,&m,&n);CHKERRQ(ierr); 155ec7775f6SShri Abhyankar ierr = MatGetOwnershipRange(X,&start,&end);CHKERRQ(ierr); 156ec7775f6SShri Abhyankar if (a == 1.0) { 157ec7775f6SShri Abhyankar for (i = start; i < end; i++) { 158ec7775f6SShri Abhyankar ierr = MatGetRow(Y,i,&ncols,&row,&vals);CHKERRQ(ierr); 159ec7775f6SShri Abhyankar ierr = MatSetValues(B,1,&i,ncols,row,vals,ADD_VALUES);CHKERRQ(ierr); 160ec7775f6SShri Abhyankar ierr = MatRestoreRow(Y,i,&ncols,&row,&vals);CHKERRQ(ierr); 161ec7775f6SShri Abhyankar 162ec7775f6SShri Abhyankar ierr = MatGetRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 163ec7775f6SShri Abhyankar ierr = MatSetValues(B,1,&i,ncols,row,vals,ADD_VALUES);CHKERRQ(ierr); 164ec7775f6SShri Abhyankar ierr = MatRestoreRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 165ec7775f6SShri Abhyankar } 166ec7775f6SShri Abhyankar } else { 167854ce69bSBarry Smith ierr = PetscMalloc1(n+1,&val);CHKERRQ(ierr); 168ec7775f6SShri Abhyankar for (i=start; i<end; i++) { 169ec7775f6SShri Abhyankar ierr = MatGetRow(Y,i,&ncols,&row,&vals);CHKERRQ(ierr); 170ec7775f6SShri Abhyankar ierr = MatSetValues(B,1,&i,ncols,row,vals,ADD_VALUES);CHKERRQ(ierr); 171ec7775f6SShri Abhyankar ierr = MatRestoreRow(Y,i,&ncols,&row,&vals);CHKERRQ(ierr); 172ec7775f6SShri Abhyankar 173ec7775f6SShri Abhyankar ierr = MatGetRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 174ec7775f6SShri Abhyankar for (j=0; j<ncols; j++) { 175ec7775f6SShri Abhyankar val[j] = a*vals[j]; 176ec7775f6SShri Abhyankar } 177ec7775f6SShri Abhyankar ierr = MatSetValues(B,1,&i,ncols,row,val,ADD_VALUES);CHKERRQ(ierr); 178ec7775f6SShri Abhyankar ierr = MatRestoreRow(X,i,&ncols,&row,&vals);CHKERRQ(ierr); 179ec7775f6SShri Abhyankar } 180ec7775f6SShri Abhyankar ierr = PetscFree(val);CHKERRQ(ierr); 181ec7775f6SShri Abhyankar } 182ec7775f6SShri Abhyankar ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 183ec7775f6SShri Abhyankar ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 184ec7775f6SShri Abhyankar PetscFunctionReturn(0); 185ec7775f6SShri Abhyankar } 186ec7775f6SShri Abhyankar 187052efed2SBarry Smith /*@ 18887828ca2SBarry Smith MatShift - Computes Y = Y + a I, where a is a PetscScalar and I is the identity matrix. 189052efed2SBarry Smith 1903f9fe445SBarry Smith Neighbor-wise Collective on Mat 191fee21e36SBarry Smith 19298a79cdbSBarry Smith Input Parameters: 19398a79cdbSBarry Smith + Y - the matrices 19487828ca2SBarry Smith - a - the PetscScalar 19598a79cdbSBarry Smith 1962860a424SLois Curfman McInnes Level: intermediate 1972860a424SLois Curfman McInnes 19895452b02SPatrick Sanan Notes: 19995452b02SPatrick Sanan If the matrix Y is missing some diagonal entries this routine can be very slow. To make it fast one should initially 2006f33a894SBarry Smith fill the matrix so that all diagonal entries have a value (with a value of zero for those locations that would not have an 2016f33a894SBarry Smith entry). 2026f33a894SBarry Smith 2030c0fd78eSBarry Smith To form Y = Y + diag(V) use MatDiagonalSet() 2040c0fd78eSBarry Smith 2056f33a894SBarry Smith Developers Note: If the local "diagonal part" of the matrix Y has no entries then the local diagonal part is 2066f33a894SBarry Smith preallocated with 1 nonzero per row for the to be added values. This allows for fast shifting of an empty matrix. 2076f33a894SBarry Smith 208052efed2SBarry Smith .keywords: matrix, add, shift 2096b9ee512SLois Curfman McInnes 2100c0fd78eSBarry Smith .seealso: MatDiagonalSet(), MatScale(), MatDiagonalScale() 211052efed2SBarry Smith @*/ 2127087cfbeSBarry Smith PetscErrorCode MatShift(Mat Y,PetscScalar a) 213052efed2SBarry Smith { 2146849ba73SBarry Smith PetscErrorCode ierr; 215052efed2SBarry Smith 2163a40ed3dSBarry Smith PetscFunctionBegin; 2170700a824SBarry Smith PetscValidHeaderSpecific(Y,MAT_CLASSID,1); 218ce94432eSBarry Smith if (!Y->assembled) SETERRQ(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 219ce94432eSBarry Smith if (Y->factortype) SETERRQ(PetscObjectComm((PetscObject)Y),PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2204994cf47SJed Brown MatCheckPreallocated(Y,1); 221b50b34bdSBarry Smith 2221c738b47SStefano Zampini if (Y->ops->shift) { 223f4df32b1SMatthew Knepley ierr = (*Y->ops->shift)(Y,a);CHKERRQ(ierr); 2241c738b47SStefano Zampini } else { 2251c738b47SStefano Zampini ierr = MatShift_Basic(Y,a);CHKERRQ(ierr); 2261c738b47SStefano Zampini } 2277d68702bSBarry Smith 2285528ad4fSTristan Konolige ierr = PetscObjectStateIncrease((PetscObject)Y);CHKERRQ(ierr); 229fd314934SBarry Smith #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 230b8ced49eSKarl Rupp if (Y->valid_GPU_matrix != PETSC_OFFLOAD_UNALLOCATED) { 231b8ced49eSKarl Rupp Y->valid_GPU_matrix = PETSC_OFFLOAD_CPU; 232c41cb2e2SAlejandro Lamas Daviña } 233d67ff14aSKarl Rupp #endif 2343a40ed3dSBarry Smith PetscFunctionReturn(0); 235052efed2SBarry Smith } 2366d84be18SBarry Smith 2377087cfbeSBarry Smith PetscErrorCode MatDiagonalSet_Default(Mat Y,Vec D,InsertMode is) 23809f38230SBarry Smith { 23909f38230SBarry Smith PetscErrorCode ierr; 24067576b8bSBarry Smith PetscInt i,start,end; 24109f38230SBarry Smith PetscScalar *v; 24209f38230SBarry Smith 24309f38230SBarry Smith PetscFunctionBegin; 24409f38230SBarry Smith ierr = MatGetOwnershipRange(Y,&start,&end);CHKERRQ(ierr); 24509f38230SBarry Smith ierr = VecGetArray(D,&v);CHKERRQ(ierr); 24609f38230SBarry Smith for (i=start; i<end; i++) { 24709f38230SBarry Smith ierr = MatSetValues(Y,1,&i,1,&i,v+i-start,is);CHKERRQ(ierr); 24809f38230SBarry Smith } 24909f38230SBarry Smith ierr = VecRestoreArray(D,&v);CHKERRQ(ierr); 25009f38230SBarry Smith ierr = MatAssemblyBegin(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 25109f38230SBarry Smith ierr = MatAssemblyEnd(Y,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 25209f38230SBarry Smith PetscFunctionReturn(0); 25309f38230SBarry Smith } 25409f38230SBarry Smith 2556d84be18SBarry Smith /*@ 256f56f2b3fSBarry Smith MatDiagonalSet - Computes Y = Y + D, where D is a diagonal matrix 257f56f2b3fSBarry Smith that is represented as a vector. Or Y[i,i] = D[i] if InsertMode is 258f56f2b3fSBarry Smith INSERT_VALUES. 2596d84be18SBarry Smith 2606d84be18SBarry Smith Input Parameters: 26198a79cdbSBarry Smith + Y - the input matrix 262f56f2b3fSBarry Smith . D - the diagonal matrix, represented as a vector 263f56f2b3fSBarry Smith - i - INSERT_VALUES or ADD_VALUES 2646d84be18SBarry Smith 2653f9fe445SBarry Smith Neighbor-wise Collective on Mat and Vec 266fee21e36SBarry Smith 26795452b02SPatrick Sanan Notes: 26895452b02SPatrick Sanan If the matrix Y is missing some diagonal entries this routine can be very slow. To make it fast one should initially 2696f33a894SBarry Smith fill the matrix so that all diagonal entries have a value (with a value of zero for those locations that would not have an 2706f33a894SBarry Smith entry). 2716f33a894SBarry Smith 2722860a424SLois Curfman McInnes Level: intermediate 2732860a424SLois Curfman McInnes 2746b9ee512SLois Curfman McInnes .keywords: matrix, add, shift, diagonal 2756b9ee512SLois Curfman McInnes 2760c0fd78eSBarry Smith .seealso: MatShift(), MatScale(), MatDiagonalScale() 2776d84be18SBarry Smith @*/ 2787087cfbeSBarry Smith PetscErrorCode MatDiagonalSet(Mat Y,Vec D,InsertMode is) 2796d84be18SBarry Smith { 2806849ba73SBarry Smith PetscErrorCode ierr; 28167576b8bSBarry Smith PetscInt matlocal,veclocal; 2826d84be18SBarry Smith 2833a40ed3dSBarry Smith PetscFunctionBegin; 2840700a824SBarry Smith PetscValidHeaderSpecific(Y,MAT_CLASSID,1); 2850700a824SBarry Smith PetscValidHeaderSpecific(D,VEC_CLASSID,2); 28667576b8bSBarry Smith ierr = MatGetLocalSize(Y,&matlocal,NULL);CHKERRQ(ierr); 28767576b8bSBarry Smith ierr = VecGetLocalSize(D,&veclocal);CHKERRQ(ierr); 28867576b8bSBarry Smith if (matlocal != veclocal) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number local rows of matrix %D does not match that of vector for diagonal %D",matlocal,veclocal); 289f56f2b3fSBarry Smith if (Y->ops->diagonalset) { 290f56f2b3fSBarry Smith ierr = (*Y->ops->diagonalset)(Y,D,is);CHKERRQ(ierr); 29194d884c6SBarry Smith } else { 29209f38230SBarry Smith ierr = MatDiagonalSet_Default(Y,D,is);CHKERRQ(ierr); 2936d84be18SBarry Smith } 2945528ad4fSTristan Konolige ierr = PetscObjectStateIncrease((PetscObject)Y);CHKERRQ(ierr); 2953a40ed3dSBarry Smith PetscFunctionReturn(0); 2966d84be18SBarry Smith } 297d4bb536fSBarry Smith 298d4bb536fSBarry Smith /*@ 29904aac2b0SHong Zhang MatAYPX - Computes Y = a*Y + X. 300d4bb536fSBarry Smith 3013f9fe445SBarry Smith Logically on Mat 302fee21e36SBarry Smith 30398a79cdbSBarry Smith Input Parameters: 30404aac2b0SHong Zhang + a - the PetscScalar multiplier 30504aac2b0SHong Zhang . Y - the first matrix 30604aac2b0SHong Zhang . X - the second matrix 30704aac2b0SHong Zhang - str - either SAME_NONZERO_PATTERN, DIFFERENT_NONZERO_PATTERN or SUBSET_NONZERO_PATTERN 308d4bb536fSBarry Smith 3092860a424SLois Curfman McInnes Level: intermediate 3102860a424SLois Curfman McInnes 311d4bb536fSBarry Smith .keywords: matrix, add 312d4bb536fSBarry Smith 3132860a424SLois Curfman McInnes .seealso: MatAXPY() 314d4bb536fSBarry Smith @*/ 3157087cfbeSBarry Smith PetscErrorCode MatAYPX(Mat Y,PetscScalar a,Mat X,MatStructure str) 316d4bb536fSBarry Smith { 31787828ca2SBarry Smith PetscScalar one = 1.0; 3186849ba73SBarry Smith PetscErrorCode ierr; 31938baddfdSBarry Smith PetscInt mX,mY,nX,nY; 320d4bb536fSBarry Smith 3213a40ed3dSBarry Smith PetscFunctionBegin; 322c5eb9154SBarry Smith PetscValidHeaderSpecific(X,MAT_CLASSID,3); 3230700a824SBarry Smith PetscValidHeaderSpecific(Y,MAT_CLASSID,1); 324c5eb9154SBarry Smith PetscValidLogicalCollectiveScalar(Y,a,2); 325329f5518SBarry Smith ierr = MatGetSize(X,&mX,&nX);CHKERRQ(ierr); 326329f5518SBarry Smith ierr = MatGetSize(X,&mY,&nY);CHKERRQ(ierr); 327e32f2f54SBarry Smith if (mX != mY || nX != nY) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Non conforming matrices: %D %D first %D %D second",mX,mY,nX,nY); 328d4bb536fSBarry Smith 329f4df32b1SMatthew Knepley ierr = MatScale(Y,a);CHKERRQ(ierr); 330cb9801acSJed Brown ierr = MatAXPY(Y,one,X,str);CHKERRQ(ierr); 3313a40ed3dSBarry Smith PetscFunctionReturn(0); 332d4bb536fSBarry Smith } 333b0a32e0cSBarry Smith 334b0a32e0cSBarry Smith /*@ 335b0a32e0cSBarry Smith MatComputeExplicitOperator - Computes the explicit matrix 336b0a32e0cSBarry Smith 337b0a32e0cSBarry Smith Collective on Mat 338b0a32e0cSBarry Smith 339b0a32e0cSBarry Smith Input Parameter: 340b0a32e0cSBarry Smith . inmat - the matrix 341b0a32e0cSBarry Smith 342b0a32e0cSBarry Smith Output Parameter: 343f3b1f45cSBarry Smith . mat - the explict operator 344b0a32e0cSBarry Smith 345b0a32e0cSBarry Smith Notes: 346b0a32e0cSBarry Smith This computation is done by applying the operators to columns of the 347b0a32e0cSBarry Smith identity matrix. 348b0a32e0cSBarry Smith 349b0a32e0cSBarry Smith Currently, this routine uses a dense matrix format when 1 processor 350b0a32e0cSBarry Smith is used and a sparse format otherwise. This routine is costly in general, 351b0a32e0cSBarry Smith and is recommended for use only with relatively small systems. 352b0a32e0cSBarry Smith 353b0a32e0cSBarry Smith Level: advanced 354b0a32e0cSBarry Smith 355b0a32e0cSBarry Smith .keywords: Mat, compute, explicit, operator 356b0a32e0cSBarry Smith @*/ 3577087cfbeSBarry Smith PetscErrorCode MatComputeExplicitOperator(Mat inmat,Mat *mat) 358b0a32e0cSBarry Smith { 359dfbe8321SBarry Smith PetscErrorCode ierr; 360b0a32e0cSBarry Smith MPI_Comm comm; 36138baddfdSBarry Smith PetscMPIInt size; 362b0a32e0cSBarry Smith 363b0a32e0cSBarry Smith PetscFunctionBegin; 3640700a824SBarry Smith PetscValidHeaderSpecific(inmat,MAT_CLASSID,1); 3654482741eSBarry Smith PetscValidPointer(mat,2); 366b0a32e0cSBarry Smith 367ce94432eSBarry Smith ierr = PetscObjectGetComm((PetscObject)inmat,&comm);CHKERRQ(ierr); 368b0a32e0cSBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 369b3d09e86SJed Brown ierr = MatConvert_Shell(inmat,size == 1 ? MATSEQDENSE : MATAIJ,MAT_INITIAL_MATRIX,mat);CHKERRQ(ierr); 37024f910e3SHong Zhang PetscFunctionReturn(0); 37124f910e3SHong Zhang } 3724325cce7SMatthew G Knepley 3734325cce7SMatthew G Knepley /*@ 374f3b1f45cSBarry Smith MatComputeExplicitOperatorTranspose - Computes the explicit matrix representation of 375f3b1f45cSBarry Smith a give matrix that can apply MatMultTranspose() 376f3b1f45cSBarry Smith 377f3b1f45cSBarry Smith Collective on Mat 378f3b1f45cSBarry Smith 379f3b1f45cSBarry Smith Input Parameter: 380f3b1f45cSBarry Smith . inmat - the matrix 381f3b1f45cSBarry Smith 382f3b1f45cSBarry Smith Output Parameter: 383f3b1f45cSBarry Smith . mat - the explict operator transposed 384f3b1f45cSBarry Smith 385f3b1f45cSBarry Smith Notes: 386f3b1f45cSBarry Smith This computation is done by applying the transpose of the operator to columns of the 387f3b1f45cSBarry Smith identity matrix. 388f3b1f45cSBarry Smith 389f3b1f45cSBarry Smith Currently, this routine uses a dense matrix format when 1 processor 390f3b1f45cSBarry Smith is used and a sparse format otherwise. This routine is costly in general, 391f3b1f45cSBarry Smith and is recommended for use only with relatively small systems. 392f3b1f45cSBarry Smith 393f3b1f45cSBarry Smith Level: advanced 394f3b1f45cSBarry Smith 395f3b1f45cSBarry Smith .keywords: Mat, compute, explicit, operator 396f3b1f45cSBarry Smith @*/ 397f3b1f45cSBarry Smith PetscErrorCode MatComputeExplicitOperatorTranspose(Mat inmat,Mat *mat) 398f3b1f45cSBarry Smith { 399f3b1f45cSBarry Smith Vec in,out; 400f3b1f45cSBarry Smith PetscErrorCode ierr; 401f3b1f45cSBarry Smith PetscInt i,m,n,M,N,*rows,start,end; 402f3b1f45cSBarry Smith MPI_Comm comm; 403f3b1f45cSBarry Smith PetscScalar *array,zero = 0.0,one = 1.0; 404f3b1f45cSBarry Smith PetscMPIInt size; 405f3b1f45cSBarry Smith 406f3b1f45cSBarry Smith PetscFunctionBegin; 407f3b1f45cSBarry Smith PetscValidHeaderSpecific(inmat,MAT_CLASSID,1); 408f3b1f45cSBarry Smith PetscValidPointer(mat,2); 409f3b1f45cSBarry Smith 410f3b1f45cSBarry Smith ierr = PetscObjectGetComm((PetscObject)inmat,&comm);CHKERRQ(ierr); 411f3b1f45cSBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 412f3b1f45cSBarry Smith 413f3b1f45cSBarry Smith ierr = MatGetLocalSize(inmat,&m,&n);CHKERRQ(ierr); 414f3b1f45cSBarry Smith ierr = MatGetSize(inmat,&M,&N);CHKERRQ(ierr); 415f3b1f45cSBarry Smith ierr = MatCreateVecs(inmat,&in,&out);CHKERRQ(ierr); 416f3b1f45cSBarry Smith ierr = VecSetOption(in,VEC_IGNORE_OFF_PROC_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 417f3b1f45cSBarry Smith ierr = VecGetOwnershipRange(out,&start,&end);CHKERRQ(ierr); 418f3b1f45cSBarry Smith ierr = PetscMalloc1(m,&rows);CHKERRQ(ierr); 419f3b1f45cSBarry Smith for (i=0; i<m; i++) rows[i] = start + i; 420f3b1f45cSBarry Smith 421f3b1f45cSBarry Smith ierr = MatCreate(comm,mat);CHKERRQ(ierr); 422f3b1f45cSBarry Smith ierr = MatSetSizes(*mat,m,n,M,N);CHKERRQ(ierr); 423f3b1f45cSBarry Smith if (size == 1) { 424f3b1f45cSBarry Smith ierr = MatSetType(*mat,MATSEQDENSE);CHKERRQ(ierr); 425f3b1f45cSBarry Smith ierr = MatSeqDenseSetPreallocation(*mat,NULL);CHKERRQ(ierr); 426f3b1f45cSBarry Smith } else { 427f3b1f45cSBarry Smith ierr = MatSetType(*mat,MATMPIAIJ);CHKERRQ(ierr); 428f3b1f45cSBarry Smith ierr = MatMPIAIJSetPreallocation(*mat,n,NULL,N-n,NULL);CHKERRQ(ierr); 429f3b1f45cSBarry Smith } 430f3b1f45cSBarry Smith 431f3b1f45cSBarry Smith for (i=0; i<N; i++) { 432f3b1f45cSBarry Smith 433f3b1f45cSBarry Smith ierr = VecSet(in,zero);CHKERRQ(ierr); 434f3b1f45cSBarry Smith ierr = VecSetValues(in,1,&i,&one,INSERT_VALUES);CHKERRQ(ierr); 435f3b1f45cSBarry Smith ierr = VecAssemblyBegin(in);CHKERRQ(ierr); 436f3b1f45cSBarry Smith ierr = VecAssemblyEnd(in);CHKERRQ(ierr); 437f3b1f45cSBarry Smith 438f3b1f45cSBarry Smith ierr = MatMultTranspose(inmat,in,out);CHKERRQ(ierr); 439f3b1f45cSBarry Smith 440f3b1f45cSBarry Smith ierr = VecGetArray(out,&array);CHKERRQ(ierr); 441f3b1f45cSBarry Smith ierr = MatSetValues(*mat,m,rows,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 442f3b1f45cSBarry Smith ierr = VecRestoreArray(out,&array);CHKERRQ(ierr); 443f3b1f45cSBarry Smith 444f3b1f45cSBarry Smith } 445f3b1f45cSBarry Smith ierr = PetscFree(rows);CHKERRQ(ierr); 446f3b1f45cSBarry Smith ierr = VecDestroy(&out);CHKERRQ(ierr); 447f3b1f45cSBarry Smith ierr = VecDestroy(&in);CHKERRQ(ierr); 448f3b1f45cSBarry Smith ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 449f3b1f45cSBarry Smith ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 450f3b1f45cSBarry Smith PetscFunctionReturn(0); 451f3b1f45cSBarry Smith } 452f3b1f45cSBarry Smith 453f3b1f45cSBarry Smith /*@ 4544325cce7SMatthew G Knepley MatChop - Set all values in the matrix less than the tolerance to zero 4554325cce7SMatthew G Knepley 4564325cce7SMatthew G Knepley Input Parameters: 4574325cce7SMatthew G Knepley + A - The matrix 4584325cce7SMatthew G Knepley - tol - The zero tolerance 4594325cce7SMatthew G Knepley 4604325cce7SMatthew G Knepley Output Parameters: 4614325cce7SMatthew G Knepley . A - The chopped matrix 4624325cce7SMatthew G Knepley 4634325cce7SMatthew G Knepley Level: intermediate 4644325cce7SMatthew G Knepley 4654325cce7SMatthew G Knepley .seealso: MatCreate(), MatZeroEntries() 4663fc99919SSatish Balay @*/ 4674325cce7SMatthew G Knepley PetscErrorCode MatChop(Mat A, PetscReal tol) 4684325cce7SMatthew G Knepley { 4694325cce7SMatthew G Knepley PetscScalar *newVals; 4704325cce7SMatthew G Knepley PetscInt *newCols; 4714325cce7SMatthew G Knepley PetscInt rStart, rEnd, numRows, maxRows, r, colMax = 0; 4724325cce7SMatthew G Knepley PetscErrorCode ierr; 4734325cce7SMatthew G Knepley 4744325cce7SMatthew G Knepley PetscFunctionBegin; 4754325cce7SMatthew G Knepley ierr = MatGetOwnershipRange(A, &rStart, &rEnd);CHKERRQ(ierr); 4764325cce7SMatthew G Knepley for (r = rStart; r < rEnd; ++r) { 4774325cce7SMatthew G Knepley PetscInt ncols; 4784325cce7SMatthew G Knepley 4790298fd71SBarry Smith ierr = MatGetRow(A, r, &ncols, NULL, NULL);CHKERRQ(ierr); 4804325cce7SMatthew G Knepley colMax = PetscMax(colMax, ncols);CHKERRQ(ierr); 4810298fd71SBarry Smith ierr = MatRestoreRow(A, r, &ncols, NULL, NULL);CHKERRQ(ierr); 4824325cce7SMatthew G Knepley } 4834325cce7SMatthew G Knepley numRows = rEnd - rStart; 484b2566f29SBarry Smith ierr = MPIU_Allreduce(&numRows, &maxRows, 1, MPIU_INT, MPI_MAX, PetscObjectComm((PetscObject)A));CHKERRQ(ierr); 485dcca6d9dSJed Brown ierr = PetscMalloc2(colMax,&newCols,colMax,&newVals);CHKERRQ(ierr); 4864325cce7SMatthew G Knepley for (r = rStart; r < rStart+maxRows; ++r) { 4874325cce7SMatthew G Knepley const PetscScalar *vals; 4884325cce7SMatthew G Knepley const PetscInt *cols; 489fad45679SMatthew G. Knepley PetscInt ncols, newcols, c; 4904325cce7SMatthew G Knepley 4914325cce7SMatthew G Knepley if (r < rEnd) { 4924325cce7SMatthew G Knepley ierr = MatGetRow(A, r, &ncols, &cols, &vals);CHKERRQ(ierr); 4934325cce7SMatthew G Knepley for (c = 0; c < ncols; ++c) { 4944325cce7SMatthew G Knepley newCols[c] = cols[c]; 4954325cce7SMatthew G Knepley newVals[c] = PetscAbsScalar(vals[c]) < tol ? 0.0 : vals[c]; 4964325cce7SMatthew G Knepley } 497fad45679SMatthew G. Knepley newcols = ncols; 4984325cce7SMatthew G Knepley ierr = MatRestoreRow(A, r, &ncols, &cols, &vals);CHKERRQ(ierr); 499fad45679SMatthew G. Knepley ierr = MatSetValues(A, 1, &r, newcols, newCols, newVals, INSERT_VALUES);CHKERRQ(ierr); 5004325cce7SMatthew G Knepley } 5014325cce7SMatthew G Knepley ierr = MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 5024325cce7SMatthew G Knepley ierr = MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 5034325cce7SMatthew G Knepley } 5044325cce7SMatthew G Knepley ierr = PetscFree2(newCols,newVals);CHKERRQ(ierr); 5054325cce7SMatthew G Knepley PetscFunctionReturn(0); 5064325cce7SMatthew G Knepley } 507