1be1d678aSKris Buschelman #define PETSCMAT_DLL 2be1d678aSKris Buschelman 367e560aaSBarry Smith /* 467e560aaSBarry Smith Defines the basic matrix operations for sequential dense. 567e560aaSBarry Smith */ 6289bc588SBarry Smith 77c4f633dSBarry Smith #include "../src/mat/impls/dense/seq/dense.h" 8f3da1532SBarry Smith #include "petscblaslapack.h" 9289bc588SBarry Smith 104a2ae208SSatish Balay #undef __FUNCT__ 114a2ae208SSatish Balay #define __FUNCT__ "MatAXPY_SeqDense" 12f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqDense(Mat Y,PetscScalar alpha,Mat X,MatStructure str) 131987afe7SBarry Smith { 141987afe7SBarry Smith Mat_SeqDense *x = (Mat_SeqDense*)X->data,*y = (Mat_SeqDense*)Y->data; 15f4df32b1SMatthew Knepley PetscScalar oalpha = alpha; 1613f74950SBarry Smith PetscInt j; 170805154bSBarry Smith PetscBLASInt N,m,ldax,lday,one = 1; 18efee365bSSatish Balay PetscErrorCode ierr; 193a40ed3dSBarry Smith 203a40ed3dSBarry Smith PetscFunctionBegin; 21d0f46423SBarry Smith N = PetscBLASIntCast(X->rmap->n*X->cmap->n); 22d0f46423SBarry Smith m = PetscBLASIntCast(X->rmap->n); 230805154bSBarry Smith ldax = PetscBLASIntCast(x->lda); 240805154bSBarry Smith lday = PetscBLASIntCast(y->lda); 25a5ce6ee0Svictorle if (ldax>m || lday>m) { 26d0f46423SBarry Smith for (j=0; j<X->cmap->n; j++) { 27f4df32b1SMatthew Knepley BLASaxpy_(&m,&oalpha,x->v+j*ldax,&one,y->v+j*lday,&one); 28a5ce6ee0Svictorle } 29a5ce6ee0Svictorle } else { 30f4df32b1SMatthew Knepley BLASaxpy_(&N,&oalpha,x->v,&one,y->v,&one); 31a5ce6ee0Svictorle } 320450473dSBarry Smith ierr = PetscLogFlops(PetscMax(2*N-1,0));CHKERRQ(ierr); 333a40ed3dSBarry Smith PetscFunctionReturn(0); 341987afe7SBarry Smith } 351987afe7SBarry Smith 364a2ae208SSatish Balay #undef __FUNCT__ 374a2ae208SSatish Balay #define __FUNCT__ "MatGetInfo_SeqDense" 38dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqDense(Mat A,MatInfoType flag,MatInfo *info) 39289bc588SBarry Smith { 40d0f46423SBarry Smith PetscInt N = A->rmap->n*A->cmap->n; 413a40ed3dSBarry Smith 423a40ed3dSBarry Smith PetscFunctionBegin; 434e220ebcSLois Curfman McInnes info->block_size = 1.0; 444e220ebcSLois Curfman McInnes info->nz_allocated = (double)N; 456de62eeeSBarry Smith info->nz_used = (double)N; 466de62eeeSBarry Smith info->nz_unneeded = (double)0; 474e220ebcSLois Curfman McInnes info->assemblies = (double)A->num_ass; 484e220ebcSLois Curfman McInnes info->mallocs = 0; 497adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 504e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 514e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 524e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 533a40ed3dSBarry Smith PetscFunctionReturn(0); 54289bc588SBarry Smith } 55289bc588SBarry Smith 564a2ae208SSatish Balay #undef __FUNCT__ 574a2ae208SSatish Balay #define __FUNCT__ "MatScale_SeqDense" 58f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqDense(Mat A,PetscScalar alpha) 5980cd9d93SLois Curfman McInnes { 60273d9f13SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 61f4df32b1SMatthew Knepley PetscScalar oalpha = alpha; 62efee365bSSatish Balay PetscErrorCode ierr; 630805154bSBarry Smith PetscBLASInt one = 1,j,nz,lda = PetscBLASIntCast(a->lda); 6480cd9d93SLois Curfman McInnes 653a40ed3dSBarry Smith PetscFunctionBegin; 66d0f46423SBarry Smith if (lda>A->rmap->n) { 67d0f46423SBarry Smith nz = PetscBLASIntCast(A->rmap->n); 68d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 69f4df32b1SMatthew Knepley BLASscal_(&nz,&oalpha,a->v+j*lda,&one); 70a5ce6ee0Svictorle } 71a5ce6ee0Svictorle } else { 72d0f46423SBarry Smith nz = PetscBLASIntCast(A->rmap->n*A->cmap->n); 73f4df32b1SMatthew Knepley BLASscal_(&nz,&oalpha,a->v,&one); 74a5ce6ee0Svictorle } 75efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 763a40ed3dSBarry Smith PetscFunctionReturn(0); 7780cd9d93SLois Curfman McInnes } 7880cd9d93SLois Curfman McInnes 791cbb95d3SBarry Smith #undef __FUNCT__ 801cbb95d3SBarry Smith #define __FUNCT__ "MatIsHermitian_SeqDense" 81ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqDense(Mat A,PetscReal rtol,PetscBool *fl) 821cbb95d3SBarry Smith { 831cbb95d3SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 84d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,N; 851cbb95d3SBarry Smith PetscScalar *v = a->v; 861cbb95d3SBarry Smith 871cbb95d3SBarry Smith PetscFunctionBegin; 881cbb95d3SBarry Smith *fl = PETSC_FALSE; 89d0f46423SBarry Smith if (A->rmap->n != A->cmap->n) PetscFunctionReturn(0); 901cbb95d3SBarry Smith N = a->lda; 911cbb95d3SBarry Smith 921cbb95d3SBarry Smith for (i=0; i<m; i++) { 931cbb95d3SBarry Smith for (j=i+1; j<m; j++) { 941cbb95d3SBarry Smith if (PetscAbsScalar(v[i+j*N] - PetscConj(v[j+i*N])) > rtol) PetscFunctionReturn(0); 951cbb95d3SBarry Smith } 961cbb95d3SBarry Smith } 971cbb95d3SBarry Smith *fl = PETSC_TRUE; 981cbb95d3SBarry Smith PetscFunctionReturn(0); 991cbb95d3SBarry Smith } 1001cbb95d3SBarry Smith 101b24902e0SBarry Smith #undef __FUNCT__ 102b24902e0SBarry Smith #define __FUNCT__ "MatDuplicateNoCreate_SeqDense" 103719d5645SBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqDense(Mat newi,Mat A,MatDuplicateOption cpvalues) 104b24902e0SBarry Smith { 105b24902e0SBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data,*l; 106b24902e0SBarry Smith PetscErrorCode ierr; 107b24902e0SBarry Smith PetscInt lda = (PetscInt)mat->lda,j,m; 108b24902e0SBarry Smith 109b24902e0SBarry Smith PetscFunctionBegin; 110719d5645SBarry Smith ierr = MatSeqDenseSetPreallocation(newi,PETSC_NULL);CHKERRQ(ierr); 111b24902e0SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 112b24902e0SBarry Smith l = (Mat_SeqDense*)newi->data; 113d0f46423SBarry Smith if (lda>A->rmap->n) { 114d0f46423SBarry Smith m = A->rmap->n; 115d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 116b24902e0SBarry Smith ierr = PetscMemcpy(l->v+j*m,mat->v+j*lda,m*sizeof(PetscScalar));CHKERRQ(ierr); 117b24902e0SBarry Smith } 118b24902e0SBarry Smith } else { 119d0f46423SBarry Smith ierr = PetscMemcpy(l->v,mat->v,A->rmap->n*A->cmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 120b24902e0SBarry Smith } 121b24902e0SBarry Smith } 122b24902e0SBarry Smith newi->assembled = PETSC_TRUE; 123b24902e0SBarry Smith PetscFunctionReturn(0); 124b24902e0SBarry Smith } 125b24902e0SBarry Smith 1264a2ae208SSatish Balay #undef __FUNCT__ 1274a2ae208SSatish Balay #define __FUNCT__ "MatDuplicate_SeqDense" 128dfbe8321SBarry Smith PetscErrorCode MatDuplicate_SeqDense(Mat A,MatDuplicateOption cpvalues,Mat *newmat) 12902cad45dSBarry Smith { 1306849ba73SBarry Smith PetscErrorCode ierr; 13102cad45dSBarry Smith 1323a40ed3dSBarry Smith PetscFunctionBegin; 1335c9eb25fSBarry Smith ierr = MatCreate(((PetscObject)A)->comm,newmat);CHKERRQ(ierr); 134d0f46423SBarry Smith ierr = MatSetSizes(*newmat,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 1355c9eb25fSBarry Smith ierr = MatSetType(*newmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 136719d5645SBarry Smith ierr = MatDuplicateNoCreate_SeqDense(*newmat,A,cpvalues);CHKERRQ(ierr); 137b24902e0SBarry Smith PetscFunctionReturn(0); 138b24902e0SBarry Smith } 139b24902e0SBarry Smith 1406ee01492SSatish Balay 1410481f469SBarry Smith extern PetscErrorCode MatLUFactor_SeqDense(Mat,IS,IS,const MatFactorInfo*); 142719d5645SBarry Smith 1434a2ae208SSatish Balay #undef __FUNCT__ 1444a2ae208SSatish Balay #define __FUNCT__ "MatLUFactorNumeric_SeqDense" 1450481f469SBarry Smith PetscErrorCode MatLUFactorNumeric_SeqDense(Mat fact,Mat A,const MatFactorInfo *info_dummy) 146289bc588SBarry Smith { 1474482741eSBarry Smith MatFactorInfo info; 148a093e273SMatthew Knepley PetscErrorCode ierr; 1493a40ed3dSBarry Smith 1503a40ed3dSBarry Smith PetscFunctionBegin; 151c3ef05f6SHong Zhang ierr = MatDuplicateNoCreate_SeqDense(fact,A,MAT_COPY_VALUES);CHKERRQ(ierr); 152719d5645SBarry Smith ierr = MatLUFactor_SeqDense(fact,0,0,&info);CHKERRQ(ierr); 1533a40ed3dSBarry Smith PetscFunctionReturn(0); 154289bc588SBarry Smith } 1556ee01492SSatish Balay 1560b4b3355SBarry Smith #undef __FUNCT__ 1574a2ae208SSatish Balay #define __FUNCT__ "MatSolve_SeqDense" 158dfbe8321SBarry Smith PetscErrorCode MatSolve_SeqDense(Mat A,Vec xx,Vec yy) 159289bc588SBarry Smith { 160c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1616849ba73SBarry Smith PetscErrorCode ierr; 16287828ca2SBarry Smith PetscScalar *x,*y; 163d0f46423SBarry Smith PetscBLASInt one = 1,info,m = PetscBLASIntCast(A->rmap->n); 16467e560aaSBarry Smith 1653a40ed3dSBarry Smith PetscFunctionBegin; 1661ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 1671ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 168d0f46423SBarry Smith ierr = PetscMemcpy(y,x,A->rmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 169d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_LU) { 170ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_GETRS) 171e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRS - Lapack routine is unavailable."); 172ae7cfcebSSatish Balay #else 17371044d3cSBarry Smith LAPACKgetrs_("N",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info); 174e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"GETRS - Bad solve"); 175ae7cfcebSSatish Balay #endif 176d5f3da31SBarry Smith } else if (A->factortype == MAT_FACTOR_CHOLESKY){ 177ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_POTRS) 178e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRS - Lapack routine is unavailable."); 179ae7cfcebSSatish Balay #else 18071044d3cSBarry Smith LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info); 181e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 182ae7cfcebSSatish Balay #endif 183289bc588SBarry Smith } 184e32f2f54SBarry Smith else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 1851ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 1861ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 187dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 1883a40ed3dSBarry Smith PetscFunctionReturn(0); 189289bc588SBarry Smith } 1906ee01492SSatish Balay 1914a2ae208SSatish Balay #undef __FUNCT__ 1924a2ae208SSatish Balay #define __FUNCT__ "MatSolveTranspose_SeqDense" 193dfbe8321SBarry Smith PetscErrorCode MatSolveTranspose_SeqDense(Mat A,Vec xx,Vec yy) 194da3a660dSBarry Smith { 195c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 196dfbe8321SBarry Smith PetscErrorCode ierr; 19787828ca2SBarry Smith PetscScalar *x,*y; 198d0f46423SBarry Smith PetscBLASInt one = 1,info,m = PetscBLASIntCast(A->rmap->n); 19967e560aaSBarry Smith 2003a40ed3dSBarry Smith PetscFunctionBegin; 2011ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 2021ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 203d0f46423SBarry Smith ierr = PetscMemcpy(y,x,A->rmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 204752f5567SLois Curfman McInnes /* assume if pivots exist then use LU; else Cholesky */ 205da3a660dSBarry Smith if (mat->pivots) { 206ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_GETRS) 207e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRS - Lapack routine is unavailable."); 208ae7cfcebSSatish Balay #else 20971044d3cSBarry Smith LAPACKgetrs_("T",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info); 210e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS - Bad solve"); 211ae7cfcebSSatish Balay #endif 2127a97a34bSBarry Smith } else { 213ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_POTRS) 214e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRS - Lapack routine is unavailable."); 215ae7cfcebSSatish Balay #else 21671044d3cSBarry Smith LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info); 217e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS - Bad solve"); 218ae7cfcebSSatish Balay #endif 219da3a660dSBarry Smith } 2201ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 2211ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 222dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 2233a40ed3dSBarry Smith PetscFunctionReturn(0); 224da3a660dSBarry Smith } 2256ee01492SSatish Balay 2264a2ae208SSatish Balay #undef __FUNCT__ 2274a2ae208SSatish Balay #define __FUNCT__ "MatSolveAdd_SeqDense" 228dfbe8321SBarry Smith PetscErrorCode MatSolveAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 229da3a660dSBarry Smith { 230c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 231dfbe8321SBarry Smith PetscErrorCode ierr; 23287828ca2SBarry Smith PetscScalar *x,*y,sone = 1.0; 233da3a660dSBarry Smith Vec tmp = 0; 234d0f46423SBarry Smith PetscBLASInt one = 1,info,m = PetscBLASIntCast(A->rmap->n); 23567e560aaSBarry Smith 2363a40ed3dSBarry Smith PetscFunctionBegin; 2371ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 2381ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 239d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 240da3a660dSBarry Smith if (yy == zz) { 24178b31e54SBarry Smith ierr = VecDuplicate(yy,&tmp);CHKERRQ(ierr); 24252e6d16bSBarry Smith ierr = PetscLogObjectParent(A,tmp);CHKERRQ(ierr); 24378b31e54SBarry Smith ierr = VecCopy(yy,tmp);CHKERRQ(ierr); 244da3a660dSBarry Smith } 245d0f46423SBarry Smith ierr = PetscMemcpy(y,x,A->rmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 246752f5567SLois Curfman McInnes /* assume if pivots exist then use LU; else Cholesky */ 247da3a660dSBarry Smith if (mat->pivots) { 248ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_GETRS) 249e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRS - Lapack routine is unavailable."); 250ae7cfcebSSatish Balay #else 25171044d3cSBarry Smith LAPACKgetrs_("N",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info); 252e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad solve"); 253ae7cfcebSSatish Balay #endif 254a8c6a408SBarry Smith } else { 255ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_POTRS) 256e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRS - Lapack routine is unavailable."); 257ae7cfcebSSatish Balay #else 25871044d3cSBarry Smith LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info); 259e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad solve"); 260ae7cfcebSSatish Balay #endif 261da3a660dSBarry Smith } 2622dcb1b2aSMatthew Knepley if (tmp) {ierr = VecAXPY(yy,sone,tmp);CHKERRQ(ierr); ierr = VecDestroy(tmp);CHKERRQ(ierr);} 2632dcb1b2aSMatthew Knepley else {ierr = VecAXPY(yy,sone,zz);CHKERRQ(ierr);} 2641ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 2651ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 266dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n);CHKERRQ(ierr); 2673a40ed3dSBarry Smith PetscFunctionReturn(0); 268da3a660dSBarry Smith } 26967e560aaSBarry Smith 2704a2ae208SSatish Balay #undef __FUNCT__ 2714a2ae208SSatish Balay #define __FUNCT__ "MatSolveTransposeAdd_SeqDense" 272dfbe8321SBarry Smith PetscErrorCode MatSolveTransposeAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 273da3a660dSBarry Smith { 274c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 2756849ba73SBarry Smith PetscErrorCode ierr; 27687828ca2SBarry Smith PetscScalar *x,*y,sone = 1.0; 277da3a660dSBarry Smith Vec tmp; 278d0f46423SBarry Smith PetscBLASInt one = 1,info,m = PetscBLASIntCast(A->rmap->n); 27967e560aaSBarry Smith 2803a40ed3dSBarry Smith PetscFunctionBegin; 281d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 2821ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 2831ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 284da3a660dSBarry Smith if (yy == zz) { 28578b31e54SBarry Smith ierr = VecDuplicate(yy,&tmp);CHKERRQ(ierr); 28652e6d16bSBarry Smith ierr = PetscLogObjectParent(A,tmp);CHKERRQ(ierr); 28778b31e54SBarry Smith ierr = VecCopy(yy,tmp);CHKERRQ(ierr); 288da3a660dSBarry Smith } 289d0f46423SBarry Smith ierr = PetscMemcpy(y,x,A->rmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 290752f5567SLois Curfman McInnes /* assume if pivots exist then use LU; else Cholesky */ 291da3a660dSBarry Smith if (mat->pivots) { 292ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_GETRS) 293e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRS - Lapack routine is unavailable."); 294ae7cfcebSSatish Balay #else 29571044d3cSBarry Smith LAPACKgetrs_("T",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info); 296e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad solve"); 297ae7cfcebSSatish Balay #endif 2983a40ed3dSBarry Smith } else { 299ae7cfcebSSatish Balay #if defined(PETSC_MISSING_LAPACK_POTRS) 300e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRS - Lapack routine is unavailable."); 301ae7cfcebSSatish Balay #else 30271044d3cSBarry Smith LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info); 303e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad solve"); 304ae7cfcebSSatish Balay #endif 305da3a660dSBarry Smith } 30690f02eecSBarry Smith if (tmp) { 3072dcb1b2aSMatthew Knepley ierr = VecAXPY(yy,sone,tmp);CHKERRQ(ierr); 30890f02eecSBarry Smith ierr = VecDestroy(tmp);CHKERRQ(ierr); 3093a40ed3dSBarry Smith } else { 3102dcb1b2aSMatthew Knepley ierr = VecAXPY(yy,sone,zz);CHKERRQ(ierr); 31190f02eecSBarry Smith } 3121ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 3131ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 314dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n);CHKERRQ(ierr); 3153a40ed3dSBarry Smith PetscFunctionReturn(0); 316da3a660dSBarry Smith } 317db4efbfdSBarry Smith 318db4efbfdSBarry Smith /* ---------------------------------------------------------------*/ 319db4efbfdSBarry Smith /* COMMENT: I have chosen to hide row permutation in the pivots, 320db4efbfdSBarry Smith rather than put it in the Mat->row slot.*/ 321db4efbfdSBarry Smith #undef __FUNCT__ 322db4efbfdSBarry Smith #define __FUNCT__ "MatLUFactor_SeqDense" 3230481f469SBarry Smith PetscErrorCode MatLUFactor_SeqDense(Mat A,IS row,IS col,const MatFactorInfo *minfo) 324db4efbfdSBarry Smith { 325db4efbfdSBarry Smith #if defined(PETSC_MISSING_LAPACK_GETRF) 326db4efbfdSBarry Smith PetscFunctionBegin; 327e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"GETRF - Lapack routine is unavailable."); 328db4efbfdSBarry Smith #else 329db4efbfdSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 330db4efbfdSBarry Smith PetscErrorCode ierr; 331db4efbfdSBarry Smith PetscBLASInt n,m,info; 332db4efbfdSBarry Smith 333db4efbfdSBarry Smith PetscFunctionBegin; 334db4efbfdSBarry Smith n = PetscBLASIntCast(A->cmap->n); 335db4efbfdSBarry Smith m = PetscBLASIntCast(A->rmap->n); 336db4efbfdSBarry Smith if (!mat->pivots) { 337db4efbfdSBarry Smith ierr = PetscMalloc((A->rmap->n+1)*sizeof(PetscBLASInt),&mat->pivots);CHKERRQ(ierr); 338db4efbfdSBarry Smith ierr = PetscLogObjectMemory(A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 339db4efbfdSBarry Smith } 340db4efbfdSBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 341db4efbfdSBarry Smith LAPACKgetrf_(&m,&n,mat->v,&mat->lda,mat->pivots,&info); 342e32f2f54SBarry Smith if (info<0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad argument to LU factorization"); 343e32f2f54SBarry Smith if (info>0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Bad LU factorization"); 344db4efbfdSBarry Smith A->ops->solve = MatSolve_SeqDense; 345db4efbfdSBarry Smith A->ops->solvetranspose = MatSolveTranspose_SeqDense; 346db4efbfdSBarry Smith A->ops->solveadd = MatSolveAdd_SeqDense; 347db4efbfdSBarry Smith A->ops->solvetransposeadd = MatSolveTransposeAdd_SeqDense; 348d5f3da31SBarry Smith A->factortype = MAT_FACTOR_LU; 349db4efbfdSBarry Smith 350dc0b31edSSatish Balay ierr = PetscLogFlops((2.0*A->cmap->n*A->cmap->n*A->cmap->n)/3);CHKERRQ(ierr); 351db4efbfdSBarry Smith #endif 352db4efbfdSBarry Smith PetscFunctionReturn(0); 353db4efbfdSBarry Smith } 354db4efbfdSBarry Smith 355db4efbfdSBarry Smith #undef __FUNCT__ 356db4efbfdSBarry Smith #define __FUNCT__ "MatCholeskyFactor_SeqDense" 3570481f469SBarry Smith PetscErrorCode MatCholeskyFactor_SeqDense(Mat A,IS perm,const MatFactorInfo *factinfo) 358db4efbfdSBarry Smith { 359db4efbfdSBarry Smith #if defined(PETSC_MISSING_LAPACK_POTRF) 360db4efbfdSBarry Smith PetscFunctionBegin; 361e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"POTRF - Lapack routine is unavailable."); 362db4efbfdSBarry Smith #else 363db4efbfdSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 364db4efbfdSBarry Smith PetscErrorCode ierr; 365db4efbfdSBarry Smith PetscBLASInt info,n = PetscBLASIntCast(A->cmap->n); 366db4efbfdSBarry Smith 367db4efbfdSBarry Smith PetscFunctionBegin; 368db4efbfdSBarry Smith ierr = PetscFree(mat->pivots);CHKERRQ(ierr); 369db4efbfdSBarry Smith mat->pivots = 0; 370db4efbfdSBarry Smith 371db4efbfdSBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 372db4efbfdSBarry Smith LAPACKpotrf_("L",&n,mat->v,&mat->lda,&info); 373e32f2f54SBarry Smith if (info) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_CH_ZRPVT,"Bad factorization: zero pivot in row %D",(PetscInt)info-1); 374db4efbfdSBarry Smith A->ops->solve = MatSolve_SeqDense; 375db4efbfdSBarry Smith A->ops->solvetranspose = MatSolveTranspose_SeqDense; 376db4efbfdSBarry Smith A->ops->solveadd = MatSolveAdd_SeqDense; 377db4efbfdSBarry Smith A->ops->solvetransposeadd = MatSolveTransposeAdd_SeqDense; 378d5f3da31SBarry Smith A->factortype = MAT_FACTOR_CHOLESKY; 379dc0b31edSSatish Balay ierr = PetscLogFlops((A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 380db4efbfdSBarry Smith #endif 381db4efbfdSBarry Smith PetscFunctionReturn(0); 382db4efbfdSBarry Smith } 383db4efbfdSBarry Smith 384db4efbfdSBarry Smith 385db4efbfdSBarry Smith #undef __FUNCT__ 386db4efbfdSBarry Smith #define __FUNCT__ "MatCholeskyFactorNumeric_SeqDense" 3870481f469SBarry Smith PetscErrorCode MatCholeskyFactorNumeric_SeqDense(Mat fact,Mat A,const MatFactorInfo *info_dummy) 388db4efbfdSBarry Smith { 389db4efbfdSBarry Smith PetscErrorCode ierr; 390db4efbfdSBarry Smith MatFactorInfo info; 391db4efbfdSBarry Smith 392db4efbfdSBarry Smith PetscFunctionBegin; 393db4efbfdSBarry Smith info.fill = 1.0; 394c3ef05f6SHong Zhang ierr = MatDuplicateNoCreate_SeqDense(fact,A,MAT_COPY_VALUES);CHKERRQ(ierr); 395719d5645SBarry Smith ierr = MatCholeskyFactor_SeqDense(fact,0,&info);CHKERRQ(ierr); 396db4efbfdSBarry Smith PetscFunctionReturn(0); 397db4efbfdSBarry Smith } 398db4efbfdSBarry Smith 399db4efbfdSBarry Smith #undef __FUNCT__ 400db4efbfdSBarry Smith #define __FUNCT__ "MatCholeskyFactorSymbolic_SeqDense" 4010481f469SBarry Smith PetscErrorCode MatCholeskyFactorSymbolic_SeqDense(Mat fact,Mat A,IS row,const MatFactorInfo *info) 402db4efbfdSBarry Smith { 403db4efbfdSBarry Smith PetscFunctionBegin; 404c3ef05f6SHong Zhang fact->assembled = PETSC_TRUE; 405719d5645SBarry Smith fact->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqDense; 406db4efbfdSBarry Smith PetscFunctionReturn(0); 407db4efbfdSBarry Smith } 408db4efbfdSBarry Smith 409db4efbfdSBarry Smith #undef __FUNCT__ 410db4efbfdSBarry Smith #define __FUNCT__ "MatLUFactorSymbolic_SeqDense" 4110481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_SeqDense(Mat fact,Mat A,IS row,IS col,const MatFactorInfo *info) 412db4efbfdSBarry Smith { 413db4efbfdSBarry Smith PetscFunctionBegin; 414c3ef05f6SHong Zhang fact->assembled = PETSC_TRUE; 415719d5645SBarry Smith fact->ops->lufactornumeric = MatLUFactorNumeric_SeqDense; 416db4efbfdSBarry Smith PetscFunctionReturn(0); 417db4efbfdSBarry Smith } 418db4efbfdSBarry Smith 419bb5747d9SMatthew Knepley EXTERN_C_BEGIN 420db4efbfdSBarry Smith #undef __FUNCT__ 421db4efbfdSBarry Smith #define __FUNCT__ "MatGetFactor_seqdense_petsc" 422db4efbfdSBarry Smith PetscErrorCode MatGetFactor_seqdense_petsc(Mat A,MatFactorType ftype,Mat *fact) 423db4efbfdSBarry Smith { 424db4efbfdSBarry Smith PetscErrorCode ierr; 425db4efbfdSBarry Smith 426db4efbfdSBarry Smith PetscFunctionBegin; 427db4efbfdSBarry Smith ierr = MatCreate(((PetscObject)A)->comm,fact);CHKERRQ(ierr); 428db4efbfdSBarry Smith ierr = MatSetSizes(*fact,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 429db4efbfdSBarry Smith ierr = MatSetType(*fact,((PetscObject)A)->type_name);CHKERRQ(ierr); 430db4efbfdSBarry Smith if (ftype == MAT_FACTOR_LU){ 431db4efbfdSBarry Smith (*fact)->ops->lufactorsymbolic = MatLUFactorSymbolic_SeqDense; 432db4efbfdSBarry Smith } else { 433db4efbfdSBarry Smith (*fact)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqDense; 434db4efbfdSBarry Smith } 435d5f3da31SBarry Smith (*fact)->factortype = ftype; 436db4efbfdSBarry Smith PetscFunctionReturn(0); 437db4efbfdSBarry Smith } 438bb5747d9SMatthew Knepley EXTERN_C_END 439db4efbfdSBarry Smith 440289bc588SBarry Smith /* ------------------------------------------------------------------*/ 4414a2ae208SSatish Balay #undef __FUNCT__ 44241f059aeSBarry Smith #define __FUNCT__ "MatSOR_SeqDense" 44341f059aeSBarry Smith PetscErrorCode MatSOR_SeqDense(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal shift,PetscInt its,PetscInt lits,Vec xx) 444289bc588SBarry Smith { 445c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 44687828ca2SBarry Smith PetscScalar *x,*b,*v = mat->v,zero = 0.0,xt; 447dfbe8321SBarry Smith PetscErrorCode ierr; 448d0f46423SBarry Smith PetscInt m = A->rmap->n,i; 449aa482453SBarry Smith #if !defined(PETSC_USE_COMPLEX) 4500805154bSBarry Smith PetscBLASInt o = 1,bm = PetscBLASIntCast(m); 451bc1b551cSSatish Balay #endif 452289bc588SBarry Smith 4533a40ed3dSBarry Smith PetscFunctionBegin; 454289bc588SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 45571044d3cSBarry Smith /* this is a hack fix, should have another version without the second BLASdot */ 4562dcb1b2aSMatthew Knepley ierr = VecSet(xx,zero);CHKERRQ(ierr); 457289bc588SBarry Smith } 4581ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 4591ebc52fbSHong Zhang ierr = VecGetArray(bb,&b);CHKERRQ(ierr); 460b965ef7fSBarry Smith its = its*lits; 461e32f2f54SBarry Smith if (its <= 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Relaxation requires global its %D and local its %D both positive",its,lits); 462289bc588SBarry Smith while (its--) { 463fccaa45eSBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP){ 464289bc588SBarry Smith for (i=0; i<m; i++) { 465aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 466f1747703SBarry Smith /* cannot use BLAS dot for complex because compiler/linker is 467f1747703SBarry Smith not happy about returning a double complex */ 46813f74950SBarry Smith PetscInt _i; 46987828ca2SBarry Smith PetscScalar sum = b[i]; 470f1747703SBarry Smith for (_i=0; _i<m; _i++) { 4713f6de6efSSatish Balay sum -= PetscConj(v[i+_i*m])*x[_i]; 472f1747703SBarry Smith } 473f1747703SBarry Smith xt = sum; 474f1747703SBarry Smith #else 47571044d3cSBarry Smith xt = b[i] - BLASdot_(&bm,v+i,&bm,x,&o); 476f1747703SBarry Smith #endif 47755a1b374SBarry Smith x[i] = (1. - omega)*x[i] + omega*(xt+v[i + i*m]*x[i])/(v[i + i*m]+shift); 478289bc588SBarry Smith } 479289bc588SBarry Smith } 480fccaa45eSBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP){ 481289bc588SBarry Smith for (i=m-1; i>=0; i--) { 482aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 483f1747703SBarry Smith /* cannot use BLAS dot for complex because compiler/linker is 484f1747703SBarry Smith not happy about returning a double complex */ 48513f74950SBarry Smith PetscInt _i; 48687828ca2SBarry Smith PetscScalar sum = b[i]; 487f1747703SBarry Smith for (_i=0; _i<m; _i++) { 4883f6de6efSSatish Balay sum -= PetscConj(v[i+_i*m])*x[_i]; 489f1747703SBarry Smith } 490f1747703SBarry Smith xt = sum; 491f1747703SBarry Smith #else 49271044d3cSBarry Smith xt = b[i] - BLASdot_(&bm,v+i,&bm,x,&o); 493f1747703SBarry Smith #endif 49455a1b374SBarry Smith x[i] = (1. - omega)*x[i] + omega*(xt+v[i + i*m]*x[i])/(v[i + i*m]+shift); 495289bc588SBarry Smith } 496289bc588SBarry Smith } 497289bc588SBarry Smith } 4981ebc52fbSHong Zhang ierr = VecRestoreArray(bb,&b);CHKERRQ(ierr); 4991ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 5003a40ed3dSBarry Smith PetscFunctionReturn(0); 501289bc588SBarry Smith } 502289bc588SBarry Smith 503289bc588SBarry Smith /* -----------------------------------------------------------------*/ 5044a2ae208SSatish Balay #undef __FUNCT__ 5054a2ae208SSatish Balay #define __FUNCT__ "MatMultTranspose_SeqDense" 506dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqDense(Mat A,Vec xx,Vec yy) 507289bc588SBarry Smith { 508c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 50987828ca2SBarry Smith PetscScalar *v = mat->v,*x,*y; 510dfbe8321SBarry Smith PetscErrorCode ierr; 5110805154bSBarry Smith PetscBLASInt m, n,_One=1; 512ea709b57SSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 5133a40ed3dSBarry Smith 5143a40ed3dSBarry Smith PetscFunctionBegin; 515d0f46423SBarry Smith m = PetscBLASIntCast(A->rmap->n); 516d0f46423SBarry Smith n = PetscBLASIntCast(A->cmap->n); 517d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 5181ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 5191ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 52071044d3cSBarry Smith BLASgemv_("T",&m,&n,&_DOne,v,&mat->lda,x,&_One,&_DZero,y,&_One); 5211ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 5221ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 523dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 5243a40ed3dSBarry Smith PetscFunctionReturn(0); 525289bc588SBarry Smith } 526800995b7SMatthew Knepley 5274a2ae208SSatish Balay #undef __FUNCT__ 5284a2ae208SSatish Balay #define __FUNCT__ "MatMult_SeqDense" 529dfbe8321SBarry Smith PetscErrorCode MatMult_SeqDense(Mat A,Vec xx,Vec yy) 530289bc588SBarry Smith { 531c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 53287828ca2SBarry Smith PetscScalar *v = mat->v,*x,*y,_DOne=1.0,_DZero=0.0; 533dfbe8321SBarry Smith PetscErrorCode ierr; 5340805154bSBarry Smith PetscBLASInt m, n, _One=1; 5353a40ed3dSBarry Smith 5363a40ed3dSBarry Smith PetscFunctionBegin; 537d0f46423SBarry Smith m = PetscBLASIntCast(A->rmap->n); 538d0f46423SBarry Smith n = PetscBLASIntCast(A->cmap->n); 539d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 5401ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 5411ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 54271044d3cSBarry Smith BLASgemv_("N",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DZero,y,&_One); 5431ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 5441ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 545dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n - A->rmap->n);CHKERRQ(ierr); 5463a40ed3dSBarry Smith PetscFunctionReturn(0); 547289bc588SBarry Smith } 5486ee01492SSatish Balay 5494a2ae208SSatish Balay #undef __FUNCT__ 5504a2ae208SSatish Balay #define __FUNCT__ "MatMultAdd_SeqDense" 551dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 552289bc588SBarry Smith { 553c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 55487828ca2SBarry Smith PetscScalar *v = mat->v,*x,*y,_DOne=1.0; 555dfbe8321SBarry Smith PetscErrorCode ierr; 5560805154bSBarry Smith PetscBLASInt m, n, _One=1; 5573a40ed3dSBarry Smith 5583a40ed3dSBarry Smith PetscFunctionBegin; 559d0f46423SBarry Smith m = PetscBLASIntCast(A->rmap->n); 560d0f46423SBarry Smith n = PetscBLASIntCast(A->cmap->n); 561d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 562600d6d0bSBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 5631ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 5641ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 56571044d3cSBarry Smith BLASgemv_("N",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DOne,y,&_One); 5661ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 5671ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 568dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n);CHKERRQ(ierr); 5693a40ed3dSBarry Smith PetscFunctionReturn(0); 570289bc588SBarry Smith } 5716ee01492SSatish Balay 5724a2ae208SSatish Balay #undef __FUNCT__ 5734a2ae208SSatish Balay #define __FUNCT__ "MatMultTransposeAdd_SeqDense" 574dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 575289bc588SBarry Smith { 576c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 57787828ca2SBarry Smith PetscScalar *v = mat->v,*x,*y; 578dfbe8321SBarry Smith PetscErrorCode ierr; 5790805154bSBarry Smith PetscBLASInt m, n, _One=1; 58087828ca2SBarry Smith PetscScalar _DOne=1.0; 5813a40ed3dSBarry Smith 5823a40ed3dSBarry Smith PetscFunctionBegin; 583d0f46423SBarry Smith m = PetscBLASIntCast(A->rmap->n); 584d0f46423SBarry Smith n = PetscBLASIntCast(A->cmap->n); 585d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 586600d6d0bSBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 5871ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 5881ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 58971044d3cSBarry Smith BLASgemv_("T",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DOne,y,&_One); 5901ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 5911ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 592dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n);CHKERRQ(ierr); 5933a40ed3dSBarry Smith PetscFunctionReturn(0); 594289bc588SBarry Smith } 595289bc588SBarry Smith 596289bc588SBarry Smith /* -----------------------------------------------------------------*/ 5974a2ae208SSatish Balay #undef __FUNCT__ 5984a2ae208SSatish Balay #define __FUNCT__ "MatGetRow_SeqDense" 59913f74950SBarry Smith PetscErrorCode MatGetRow_SeqDense(Mat A,PetscInt row,PetscInt *ncols,PetscInt **cols,PetscScalar **vals) 600289bc588SBarry Smith { 601c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 60287828ca2SBarry Smith PetscScalar *v; 6036849ba73SBarry Smith PetscErrorCode ierr; 60413f74950SBarry Smith PetscInt i; 60567e560aaSBarry Smith 6063a40ed3dSBarry Smith PetscFunctionBegin; 607d0f46423SBarry Smith *ncols = A->cmap->n; 608289bc588SBarry Smith if (cols) { 609d0f46423SBarry Smith ierr = PetscMalloc((A->cmap->n+1)*sizeof(PetscInt),cols);CHKERRQ(ierr); 610d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) (*cols)[i] = i; 611289bc588SBarry Smith } 612289bc588SBarry Smith if (vals) { 613d0f46423SBarry Smith ierr = PetscMalloc((A->cmap->n+1)*sizeof(PetscScalar),vals);CHKERRQ(ierr); 614289bc588SBarry Smith v = mat->v + row; 615d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) {(*vals)[i] = *v; v += mat->lda;} 616289bc588SBarry Smith } 6173a40ed3dSBarry Smith PetscFunctionReturn(0); 618289bc588SBarry Smith } 6196ee01492SSatish Balay 6204a2ae208SSatish Balay #undef __FUNCT__ 6214a2ae208SSatish Balay #define __FUNCT__ "MatRestoreRow_SeqDense" 62213f74950SBarry Smith PetscErrorCode MatRestoreRow_SeqDense(Mat A,PetscInt row,PetscInt *ncols,PetscInt **cols,PetscScalar **vals) 623289bc588SBarry Smith { 624dfbe8321SBarry Smith PetscErrorCode ierr; 625606d414cSSatish Balay PetscFunctionBegin; 626606d414cSSatish Balay if (cols) {ierr = PetscFree(*cols);CHKERRQ(ierr);} 627606d414cSSatish Balay if (vals) {ierr = PetscFree(*vals);CHKERRQ(ierr); } 6283a40ed3dSBarry Smith PetscFunctionReturn(0); 629289bc588SBarry Smith } 630289bc588SBarry Smith /* ----------------------------------------------------------------*/ 6314a2ae208SSatish Balay #undef __FUNCT__ 6324a2ae208SSatish Balay #define __FUNCT__ "MatSetValues_SeqDense" 63313f74950SBarry Smith PetscErrorCode MatSetValues_SeqDense(Mat A,PetscInt m,const PetscInt indexm[],PetscInt n,const PetscInt indexn[],const PetscScalar v[],InsertMode addv) 634289bc588SBarry Smith { 635c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 63613f74950SBarry Smith PetscInt i,j,idx=0; 637d6dfbf8fSBarry Smith 6383a40ed3dSBarry Smith PetscFunctionBegin; 63971fd2e92SBarry Smith if (v) PetscValidScalarPointer(v,6); 640289bc588SBarry Smith if (!mat->roworiented) { 641dbb450caSBarry Smith if (addv == INSERT_VALUES) { 642289bc588SBarry Smith for (j=0; j<n; j++) { 643cddbea37SSatish Balay if (indexn[j] < 0) {idx += m; continue;} 6442515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 645e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 64658804f6dSBarry Smith #endif 647289bc588SBarry Smith for (i=0; i<m; i++) { 648cddbea37SSatish Balay if (indexm[i] < 0) {idx++; continue;} 6492515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 650e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 65158804f6dSBarry Smith #endif 652cddbea37SSatish Balay mat->v[indexn[j]*mat->lda + indexm[i]] = v[idx++]; 653289bc588SBarry Smith } 654289bc588SBarry Smith } 6553a40ed3dSBarry Smith } else { 656289bc588SBarry Smith for (j=0; j<n; j++) { 657cddbea37SSatish Balay if (indexn[j] < 0) {idx += m; continue;} 6582515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 659e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 66058804f6dSBarry Smith #endif 661289bc588SBarry Smith for (i=0; i<m; i++) { 662cddbea37SSatish Balay if (indexm[i] < 0) {idx++; continue;} 6632515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 664e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 66558804f6dSBarry Smith #endif 666cddbea37SSatish Balay mat->v[indexn[j]*mat->lda + indexm[i]] += v[idx++]; 667289bc588SBarry Smith } 668289bc588SBarry Smith } 669289bc588SBarry Smith } 6703a40ed3dSBarry Smith } else { 671dbb450caSBarry Smith if (addv == INSERT_VALUES) { 672e8d4e0b9SBarry Smith for (i=0; i<m; i++) { 673cddbea37SSatish Balay if (indexm[i] < 0) { idx += n; continue;} 6742515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 675e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 67658804f6dSBarry Smith #endif 677e8d4e0b9SBarry Smith for (j=0; j<n; j++) { 678cddbea37SSatish Balay if (indexn[j] < 0) { idx++; continue;} 6792515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 680e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 68158804f6dSBarry Smith #endif 682cddbea37SSatish Balay mat->v[indexn[j]*mat->lda + indexm[i]] = v[idx++]; 683e8d4e0b9SBarry Smith } 684e8d4e0b9SBarry Smith } 6853a40ed3dSBarry Smith } else { 686289bc588SBarry Smith for (i=0; i<m; i++) { 687cddbea37SSatish Balay if (indexm[i] < 0) { idx += n; continue;} 6882515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 689e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 69058804f6dSBarry Smith #endif 691289bc588SBarry Smith for (j=0; j<n; j++) { 692cddbea37SSatish Balay if (indexn[j] < 0) { idx++; continue;} 6932515c552SBarry Smith #if defined(PETSC_USE_DEBUG) 694e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 69558804f6dSBarry Smith #endif 696cddbea37SSatish Balay mat->v[indexn[j]*mat->lda + indexm[i]] += v[idx++]; 697289bc588SBarry Smith } 698289bc588SBarry Smith } 699289bc588SBarry Smith } 700e8d4e0b9SBarry Smith } 7013a40ed3dSBarry Smith PetscFunctionReturn(0); 702289bc588SBarry Smith } 703e8d4e0b9SBarry Smith 7044a2ae208SSatish Balay #undef __FUNCT__ 7054a2ae208SSatish Balay #define __FUNCT__ "MatGetValues_SeqDense" 70613f74950SBarry Smith PetscErrorCode MatGetValues_SeqDense(Mat A,PetscInt m,const PetscInt indexm[],PetscInt n,const PetscInt indexn[],PetscScalar v[]) 707ae80bb75SLois Curfman McInnes { 708ae80bb75SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 70913f74950SBarry Smith PetscInt i,j; 710ae80bb75SLois Curfman McInnes 7113a40ed3dSBarry Smith PetscFunctionBegin; 712ae80bb75SLois Curfman McInnes /* row-oriented output */ 713ae80bb75SLois Curfman McInnes for (i=0; i<m; i++) { 71497e567efSBarry Smith if (indexm[i] < 0) {v += n;continue;} 715e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested larger than number rows %D",indexm[i],A->rmap->n); 716ae80bb75SLois Curfman McInnes for (j=0; j<n; j++) { 7176f31f424SBarry Smith if (indexn[j] < 0) {v++; continue;} 718e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column %D requested larger than number columns %D",indexn[j],A->cmap->n); 71997e567efSBarry Smith *v++ = mat->v[indexn[j]*mat->lda + indexm[i]]; 720ae80bb75SLois Curfman McInnes } 721ae80bb75SLois Curfman McInnes } 7223a40ed3dSBarry Smith PetscFunctionReturn(0); 723ae80bb75SLois Curfman McInnes } 724ae80bb75SLois Curfman McInnes 725289bc588SBarry Smith /* -----------------------------------------------------------------*/ 726289bc588SBarry Smith 7274a2ae208SSatish Balay #undef __FUNCT__ 7285bba2384SShri Abhyankar #define __FUNCT__ "MatLoad_SeqDense" 729112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqDense(Mat newmat,PetscViewer viewer) 730aabbc4fbSShri Abhyankar { 731aabbc4fbSShri Abhyankar Mat_SeqDense *a; 732aabbc4fbSShri Abhyankar PetscErrorCode ierr; 733aabbc4fbSShri Abhyankar PetscInt *scols,i,j,nz,header[4]; 734aabbc4fbSShri Abhyankar int fd; 735aabbc4fbSShri Abhyankar PetscMPIInt size; 736aabbc4fbSShri Abhyankar PetscInt *rowlengths = 0,M,N,*cols,grows,gcols; 737aabbc4fbSShri Abhyankar PetscScalar *vals,*svals,*v,*w; 738aabbc4fbSShri Abhyankar MPI_Comm comm = ((PetscObject)viewer)->comm; 739aabbc4fbSShri Abhyankar 740aabbc4fbSShri Abhyankar PetscFunctionBegin; 741aabbc4fbSShri Abhyankar ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 742aabbc4fbSShri Abhyankar if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"view must have one processor"); 743aabbc4fbSShri Abhyankar ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 744aabbc4fbSShri Abhyankar ierr = PetscBinaryRead(fd,header,4,PETSC_INT);CHKERRQ(ierr); 745aabbc4fbSShri Abhyankar if (header[0] != MAT_FILE_CLASSID) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Not matrix object"); 746aabbc4fbSShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 747aabbc4fbSShri Abhyankar 748aabbc4fbSShri Abhyankar /* set global size if not set already*/ 749aabbc4fbSShri Abhyankar if (newmat->rmap->n < 0 && newmat->rmap->N < 0 && newmat->cmap->n < 0 && newmat->cmap->N < 0) { 750aabbc4fbSShri Abhyankar ierr = MatSetSizes(newmat,M,N,M,N);CHKERRQ(ierr); 751aabbc4fbSShri Abhyankar } else { 752aabbc4fbSShri Abhyankar /* if sizes and type are already set, check if the vector global sizes are correct */ 753aabbc4fbSShri Abhyankar ierr = MatGetSize(newmat,&grows,&gcols);CHKERRQ(ierr); 754aabbc4fbSShri Abhyankar if (M != grows || N != gcols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%d, %d) than the input matrix (%d, %d)",M,N,grows,gcols); 755aabbc4fbSShri Abhyankar } 756aabbc4fbSShri Abhyankar ierr = MatSeqDenseSetPreallocation(newmat,PETSC_NULL);CHKERRQ(ierr); 757aabbc4fbSShri Abhyankar 758aabbc4fbSShri Abhyankar if (nz == MATRIX_BINARY_FORMAT_DENSE) { /* matrix in file is dense */ 759aabbc4fbSShri Abhyankar a = (Mat_SeqDense*)newmat->data; 760aabbc4fbSShri Abhyankar v = a->v; 761aabbc4fbSShri Abhyankar /* Allocate some temp space to read in the values and then flip them 762aabbc4fbSShri Abhyankar from row major to column major */ 763aabbc4fbSShri Abhyankar ierr = PetscMalloc((M*N > 0 ? M*N : 1)*sizeof(PetscScalar),&w);CHKERRQ(ierr); 764aabbc4fbSShri Abhyankar /* read in nonzero values */ 765aabbc4fbSShri Abhyankar ierr = PetscBinaryRead(fd,w,M*N,PETSC_SCALAR);CHKERRQ(ierr); 766aabbc4fbSShri Abhyankar /* now flip the values and store them in the matrix*/ 767aabbc4fbSShri Abhyankar for (j=0; j<N; j++) { 768aabbc4fbSShri Abhyankar for (i=0; i<M; i++) { 769aabbc4fbSShri Abhyankar *v++ =w[i*N+j]; 770aabbc4fbSShri Abhyankar } 771aabbc4fbSShri Abhyankar } 772aabbc4fbSShri Abhyankar ierr = PetscFree(w);CHKERRQ(ierr); 773aabbc4fbSShri Abhyankar } else { 774aabbc4fbSShri Abhyankar /* read row lengths */ 775aabbc4fbSShri Abhyankar ierr = PetscMalloc((M+1)*sizeof(PetscInt),&rowlengths);CHKERRQ(ierr); 776aabbc4fbSShri Abhyankar ierr = PetscBinaryRead(fd,rowlengths,M,PETSC_INT);CHKERRQ(ierr); 777aabbc4fbSShri Abhyankar 778aabbc4fbSShri Abhyankar a = (Mat_SeqDense*)newmat->data; 779aabbc4fbSShri Abhyankar v = a->v; 780aabbc4fbSShri Abhyankar 781aabbc4fbSShri Abhyankar /* read column indices and nonzeros */ 782aabbc4fbSShri Abhyankar ierr = PetscMalloc((nz+1)*sizeof(PetscInt),&scols);CHKERRQ(ierr); 783aabbc4fbSShri Abhyankar cols = scols; 784aabbc4fbSShri Abhyankar ierr = PetscBinaryRead(fd,cols,nz,PETSC_INT);CHKERRQ(ierr); 785aabbc4fbSShri Abhyankar ierr = PetscMalloc((nz+1)*sizeof(PetscScalar),&svals);CHKERRQ(ierr); 786aabbc4fbSShri Abhyankar vals = svals; 787aabbc4fbSShri Abhyankar ierr = PetscBinaryRead(fd,vals,nz,PETSC_SCALAR);CHKERRQ(ierr); 788aabbc4fbSShri Abhyankar 789aabbc4fbSShri Abhyankar /* insert into matrix */ 790aabbc4fbSShri Abhyankar for (i=0; i<M; i++) { 791aabbc4fbSShri Abhyankar for (j=0; j<rowlengths[i]; j++) v[i+M*scols[j]] = svals[j]; 792aabbc4fbSShri Abhyankar svals += rowlengths[i]; scols += rowlengths[i]; 793aabbc4fbSShri Abhyankar } 794aabbc4fbSShri Abhyankar ierr = PetscFree(vals);CHKERRQ(ierr); 795aabbc4fbSShri Abhyankar ierr = PetscFree(cols);CHKERRQ(ierr); 796aabbc4fbSShri Abhyankar ierr = PetscFree(rowlengths);CHKERRQ(ierr); 797aabbc4fbSShri Abhyankar } 798aabbc4fbSShri Abhyankar ierr = MatAssemblyBegin(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 799aabbc4fbSShri Abhyankar ierr = MatAssemblyEnd(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 800aabbc4fbSShri Abhyankar 801aabbc4fbSShri Abhyankar PetscFunctionReturn(0); 802aabbc4fbSShri Abhyankar } 803aabbc4fbSShri Abhyankar 804aabbc4fbSShri Abhyankar #undef __FUNCT__ 8054a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqDense_ASCII" 8066849ba73SBarry Smith static PetscErrorCode MatView_SeqDense_ASCII(Mat A,PetscViewer viewer) 807289bc588SBarry Smith { 808932b0c3eSLois Curfman McInnes Mat_SeqDense *a = (Mat_SeqDense*)A->data; 809dfbe8321SBarry Smith PetscErrorCode ierr; 81013f74950SBarry Smith PetscInt i,j; 8112dcb1b2aSMatthew Knepley const char *name; 81287828ca2SBarry Smith PetscScalar *v; 813f3ef73ceSBarry Smith PetscViewerFormat format; 8145f481a85SSatish Balay #if defined(PETSC_USE_COMPLEX) 815ace3abfcSBarry Smith PetscBool allreal = PETSC_TRUE; 8165f481a85SSatish Balay #endif 817932b0c3eSLois Curfman McInnes 8183a40ed3dSBarry Smith PetscFunctionBegin; 819b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 820456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 8213a40ed3dSBarry Smith PetscFunctionReturn(0); /* do nothing for now */ 822fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 823b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_NO);CHKERRQ(ierr); 8247566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 825d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 82644cd7ae7SLois Curfman McInnes v = a->v + i; 82777431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 828d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 829aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 830329f5518SBarry Smith if (PetscRealPart(*v) != 0.0 && PetscImaginaryPart(*v) != 0.0) { 831a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G + %G i) ",j,PetscRealPart(*v),PetscImaginaryPart(*v));CHKERRQ(ierr); 832329f5518SBarry Smith } else if (PetscRealPart(*v)) { 833a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",j,PetscRealPart(*v));CHKERRQ(ierr); 8346831982aSBarry Smith } 83580cd9d93SLois Curfman McInnes #else 8366831982aSBarry Smith if (*v) { 837a83599f4SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %G) ",j,*v);CHKERRQ(ierr); 8386831982aSBarry Smith } 83980cd9d93SLois Curfman McInnes #endif 8401b807ce4Svictorle v += a->lda; 84180cd9d93SLois Curfman McInnes } 842b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 84380cd9d93SLois Curfman McInnes } 844b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_YES);CHKERRQ(ierr); 8453a40ed3dSBarry Smith } else { 846b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_NO);CHKERRQ(ierr); 847aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 84847989497SBarry Smith /* determine if matrix has all real values */ 84947989497SBarry Smith v = a->v; 850d0f46423SBarry Smith for (i=0; i<A->rmap->n*A->cmap->n; i++) { 851ffac6cdbSBarry Smith if (PetscImaginaryPart(v[i])) { allreal = PETSC_FALSE; break ;} 85247989497SBarry Smith } 85347989497SBarry Smith #endif 854fb9695e5SSatish Balay if (format == PETSC_VIEWER_ASCII_MATLAB) { 8553a7fca6bSBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 856d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",A->rmap->n,A->cmap->n);CHKERRQ(ierr); 857d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%s = zeros(%D,%D);\n",name,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 858fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"%s = [\n",name);CHKERRQ(ierr); 8597566de4bSShri Abhyankar } else { 8607566de4bSShri Abhyankar ierr = PetscObjectPrintClassNamePrefixType((PetscObject)A,viewer,"Matrix Object");CHKERRQ(ierr); 861ffac6cdbSBarry Smith } 862ffac6cdbSBarry Smith 863d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 864932b0c3eSLois Curfman McInnes v = a->v + i; 865d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 866aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 86747989497SBarry Smith if (allreal) { 868f32d5d43SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%18.16e ",PetscRealPart(*v));CHKERRQ(ierr); 86947989497SBarry Smith } else { 870f32d5d43SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%18.16e + %18.16e i ",PetscRealPart(*v),PetscImaginaryPart(*v));CHKERRQ(ierr); 87147989497SBarry Smith } 872289bc588SBarry Smith #else 873f32d5d43SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%18.16e ",*v);CHKERRQ(ierr); 874289bc588SBarry Smith #endif 8751b807ce4Svictorle v += a->lda; 876289bc588SBarry Smith } 877b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 878289bc588SBarry Smith } 879fb9695e5SSatish Balay if (format == PETSC_VIEWER_ASCII_MATLAB) { 880b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"];\n");CHKERRQ(ierr); 881ffac6cdbSBarry Smith } 882b0a32e0cSBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_YES);CHKERRQ(ierr); 883da3a660dSBarry Smith } 884b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 8853a40ed3dSBarry Smith PetscFunctionReturn(0); 886289bc588SBarry Smith } 887289bc588SBarry Smith 8884a2ae208SSatish Balay #undef __FUNCT__ 8894a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqDense_Binary" 8906849ba73SBarry Smith static PetscErrorCode MatView_SeqDense_Binary(Mat A,PetscViewer viewer) 891932b0c3eSLois Curfman McInnes { 892932b0c3eSLois Curfman McInnes Mat_SeqDense *a = (Mat_SeqDense*)A->data; 8936849ba73SBarry Smith PetscErrorCode ierr; 89413f74950SBarry Smith int fd; 895d0f46423SBarry Smith PetscInt ict,j,n = A->cmap->n,m = A->rmap->n,i,*col_lens,nz = m*n; 896f4403165SShri Abhyankar PetscScalar *v,*anonz,*vals; 897f4403165SShri Abhyankar PetscViewerFormat format; 898932b0c3eSLois Curfman McInnes 8993a40ed3dSBarry Smith PetscFunctionBegin; 900b0a32e0cSBarry Smith ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 90190ace30eSBarry Smith 902f4403165SShri Abhyankar ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 903f4403165SShri Abhyankar if (format == PETSC_VIEWER_NATIVE) { 904f4403165SShri Abhyankar /* store the matrix as a dense matrix */ 905f4403165SShri Abhyankar ierr = PetscMalloc(4*sizeof(PetscInt),&col_lens);CHKERRQ(ierr); 906f4403165SShri Abhyankar col_lens[0] = MAT_FILE_CLASSID; 907f4403165SShri Abhyankar col_lens[1] = m; 908f4403165SShri Abhyankar col_lens[2] = n; 909f4403165SShri Abhyankar col_lens[3] = MATRIX_BINARY_FORMAT_DENSE; 910f4403165SShri Abhyankar ierr = PetscBinaryWrite(fd,col_lens,4,PETSC_INT,PETSC_TRUE);CHKERRQ(ierr); 911f4403165SShri Abhyankar ierr = PetscFree(col_lens);CHKERRQ(ierr); 912f4403165SShri Abhyankar 913f4403165SShri Abhyankar /* write out matrix, by rows */ 914f4403165SShri Abhyankar ierr = PetscMalloc((m*n+1)*sizeof(PetscScalar),&vals);CHKERRQ(ierr); 915f4403165SShri Abhyankar v = a->v; 916f4403165SShri Abhyankar for (j=0; j<n; j++) { 917f4403165SShri Abhyankar for (i=0; i<m; i++) { 918f4403165SShri Abhyankar vals[j + i*n] = *v++; 919f4403165SShri Abhyankar } 920f4403165SShri Abhyankar } 921f4403165SShri Abhyankar ierr = PetscBinaryWrite(fd,vals,n*m,PETSC_SCALAR,PETSC_FALSE);CHKERRQ(ierr); 922f4403165SShri Abhyankar ierr = PetscFree(vals);CHKERRQ(ierr); 923f4403165SShri Abhyankar } else { 92413f74950SBarry Smith ierr = PetscMalloc((4+nz)*sizeof(PetscInt),&col_lens);CHKERRQ(ierr); 9250700a824SBarry Smith col_lens[0] = MAT_FILE_CLASSID; 926932b0c3eSLois Curfman McInnes col_lens[1] = m; 927932b0c3eSLois Curfman McInnes col_lens[2] = n; 928932b0c3eSLois Curfman McInnes col_lens[3] = nz; 929932b0c3eSLois Curfman McInnes 930932b0c3eSLois Curfman McInnes /* store lengths of each row and write (including header) to file */ 931932b0c3eSLois Curfman McInnes for (i=0; i<m; i++) col_lens[4+i] = n; 9326f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,col_lens,4+m,PETSC_INT,PETSC_TRUE);CHKERRQ(ierr); 933932b0c3eSLois Curfman McInnes 934932b0c3eSLois Curfman McInnes /* Possibly should write in smaller increments, not whole matrix at once? */ 935932b0c3eSLois Curfman McInnes /* store column indices (zero start index) */ 936932b0c3eSLois Curfman McInnes ict = 0; 937932b0c3eSLois Curfman McInnes for (i=0; i<m; i++) { 938932b0c3eSLois Curfman McInnes for (j=0; j<n; j++) col_lens[ict++] = j; 939932b0c3eSLois Curfman McInnes } 9406f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,col_lens,nz,PETSC_INT,PETSC_FALSE);CHKERRQ(ierr); 941606d414cSSatish Balay ierr = PetscFree(col_lens);CHKERRQ(ierr); 942932b0c3eSLois Curfman McInnes 943932b0c3eSLois Curfman McInnes /* store nonzero values */ 94487828ca2SBarry Smith ierr = PetscMalloc((nz+1)*sizeof(PetscScalar),&anonz);CHKERRQ(ierr); 945932b0c3eSLois Curfman McInnes ict = 0; 946932b0c3eSLois Curfman McInnes for (i=0; i<m; i++) { 947932b0c3eSLois Curfman McInnes v = a->v + i; 948932b0c3eSLois Curfman McInnes for (j=0; j<n; j++) { 9491b807ce4Svictorle anonz[ict++] = *v; v += a->lda; 950932b0c3eSLois Curfman McInnes } 951932b0c3eSLois Curfman McInnes } 9526f69ff64SBarry Smith ierr = PetscBinaryWrite(fd,anonz,nz,PETSC_SCALAR,PETSC_FALSE);CHKERRQ(ierr); 953606d414cSSatish Balay ierr = PetscFree(anonz);CHKERRQ(ierr); 954f4403165SShri Abhyankar } 9553a40ed3dSBarry Smith PetscFunctionReturn(0); 956932b0c3eSLois Curfman McInnes } 957932b0c3eSLois Curfman McInnes 9584a2ae208SSatish Balay #undef __FUNCT__ 9594a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqDense_Draw_Zoom" 960dfbe8321SBarry Smith PetscErrorCode MatView_SeqDense_Draw_Zoom(PetscDraw draw,void *Aa) 961f1af5d2fSBarry Smith { 962f1af5d2fSBarry Smith Mat A = (Mat) Aa; 963f1af5d2fSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 9646849ba73SBarry Smith PetscErrorCode ierr; 965d0f46423SBarry Smith PetscInt m = A->rmap->n,n = A->cmap->n,color,i,j; 96687828ca2SBarry Smith PetscScalar *v = a->v; 967b0a32e0cSBarry Smith PetscViewer viewer; 968b0a32e0cSBarry Smith PetscDraw popup; 969329f5518SBarry Smith PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r,scale,maxv = 0.0; 970f3ef73ceSBarry Smith PetscViewerFormat format; 971f1af5d2fSBarry Smith 972f1af5d2fSBarry Smith PetscFunctionBegin; 973f1af5d2fSBarry Smith 974f1af5d2fSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 975b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 976b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 977f1af5d2fSBarry Smith 978f1af5d2fSBarry Smith /* Loop over matrix elements drawing boxes */ 979fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 980f1af5d2fSBarry Smith /* Blue for negative and Red for positive */ 981b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 982f1af5d2fSBarry Smith for(j = 0; j < n; j++) { 983f1af5d2fSBarry Smith x_l = j; 984f1af5d2fSBarry Smith x_r = x_l + 1.0; 985f1af5d2fSBarry Smith for(i = 0; i < m; i++) { 986f1af5d2fSBarry Smith y_l = m - i - 1.0; 987f1af5d2fSBarry Smith y_r = y_l + 1.0; 988f1af5d2fSBarry Smith #if defined(PETSC_USE_COMPLEX) 989329f5518SBarry Smith if (PetscRealPart(v[j*m+i]) > 0.) { 990b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 991329f5518SBarry Smith } else if (PetscRealPart(v[j*m+i]) < 0.) { 992b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 993f1af5d2fSBarry Smith } else { 994f1af5d2fSBarry Smith continue; 995f1af5d2fSBarry Smith } 996f1af5d2fSBarry Smith #else 997f1af5d2fSBarry Smith if (v[j*m+i] > 0.) { 998b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 999f1af5d2fSBarry Smith } else if (v[j*m+i] < 0.) { 1000b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 1001f1af5d2fSBarry Smith } else { 1002f1af5d2fSBarry Smith continue; 1003f1af5d2fSBarry Smith } 1004f1af5d2fSBarry Smith #endif 1005b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 1006f1af5d2fSBarry Smith } 1007f1af5d2fSBarry Smith } 1008f1af5d2fSBarry Smith } else { 1009f1af5d2fSBarry Smith /* use contour shading to indicate magnitude of values */ 1010f1af5d2fSBarry Smith /* first determine max of all nonzero values */ 1011f1af5d2fSBarry Smith for(i = 0; i < m*n; i++) { 1012f1af5d2fSBarry Smith if (PetscAbsScalar(v[i]) > maxv) maxv = PetscAbsScalar(v[i]); 1013f1af5d2fSBarry Smith } 1014b0a32e0cSBarry Smith scale = (245.0 - PETSC_DRAW_BASIC_COLORS)/maxv; 1015b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 1016b0a32e0cSBarry Smith if (popup) {ierr = PetscDrawScalePopup(popup,0.0,maxv);CHKERRQ(ierr);} 1017f1af5d2fSBarry Smith for(j = 0; j < n; j++) { 1018f1af5d2fSBarry Smith x_l = j; 1019f1af5d2fSBarry Smith x_r = x_l + 1.0; 1020f1af5d2fSBarry Smith for(i = 0; i < m; i++) { 1021f1af5d2fSBarry Smith y_l = m - i - 1.0; 1022f1af5d2fSBarry Smith y_r = y_l + 1.0; 1023b0a32e0cSBarry Smith color = PETSC_DRAW_BASIC_COLORS + (int)(scale*PetscAbsScalar(v[j*m+i])); 1024b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 1025f1af5d2fSBarry Smith } 1026f1af5d2fSBarry Smith } 1027f1af5d2fSBarry Smith } 1028f1af5d2fSBarry Smith PetscFunctionReturn(0); 1029f1af5d2fSBarry Smith } 1030f1af5d2fSBarry Smith 10314a2ae208SSatish Balay #undef __FUNCT__ 10324a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqDense_Draw" 1033dfbe8321SBarry Smith PetscErrorCode MatView_SeqDense_Draw(Mat A,PetscViewer viewer) 1034f1af5d2fSBarry Smith { 1035b0a32e0cSBarry Smith PetscDraw draw; 1036ace3abfcSBarry Smith PetscBool isnull; 1037329f5518SBarry Smith PetscReal xr,yr,xl,yl,h,w; 1038dfbe8321SBarry Smith PetscErrorCode ierr; 1039f1af5d2fSBarry Smith 1040f1af5d2fSBarry Smith PetscFunctionBegin; 1041b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 1042b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 1043abc0a331SBarry Smith if (isnull) PetscFunctionReturn(0); 1044f1af5d2fSBarry Smith 1045f1af5d2fSBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 1046d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1047f1af5d2fSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 1048b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 1049b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqDense_Draw_Zoom,A);CHKERRQ(ierr); 1050f1af5d2fSBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",PETSC_NULL);CHKERRQ(ierr); 1051f1af5d2fSBarry Smith PetscFunctionReturn(0); 1052f1af5d2fSBarry Smith } 1053f1af5d2fSBarry Smith 10544a2ae208SSatish Balay #undef __FUNCT__ 10554a2ae208SSatish Balay #define __FUNCT__ "MatView_SeqDense" 1056dfbe8321SBarry Smith PetscErrorCode MatView_SeqDense(Mat A,PetscViewer viewer) 1057932b0c3eSLois Curfman McInnes { 1058dfbe8321SBarry Smith PetscErrorCode ierr; 1059ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1060932b0c3eSLois Curfman McInnes 10613a40ed3dSBarry Smith PetscFunctionBegin; 10622692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 10632692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 10642692d6eeSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 10650f5bd95cSBarry Smith 1066c45a1595SBarry Smith if (iascii) { 1067c45a1595SBarry Smith ierr = MatView_SeqDense_ASCII(A,viewer);CHKERRQ(ierr); 10680f5bd95cSBarry Smith } else if (isbinary) { 10693a40ed3dSBarry Smith ierr = MatView_SeqDense_Binary(A,viewer);CHKERRQ(ierr); 1070f1af5d2fSBarry Smith } else if (isdraw) { 1071f1af5d2fSBarry Smith ierr = MatView_SeqDense_Draw(A,viewer);CHKERRQ(ierr); 10725cd90555SBarry Smith } else { 1073e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Viewer type %s not supported by dense matrix",((PetscObject)viewer)->type_name); 1074932b0c3eSLois Curfman McInnes } 10753a40ed3dSBarry Smith PetscFunctionReturn(0); 1076932b0c3eSLois Curfman McInnes } 1077289bc588SBarry Smith 10784a2ae208SSatish Balay #undef __FUNCT__ 10794a2ae208SSatish Balay #define __FUNCT__ "MatDestroy_SeqDense" 1080dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqDense(Mat mat) 1081289bc588SBarry Smith { 1082ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)mat->data; 1083dfbe8321SBarry Smith PetscErrorCode ierr; 108490f02eecSBarry Smith 10853a40ed3dSBarry Smith PetscFunctionBegin; 1086aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1087d0f46423SBarry Smith PetscLogObjectState((PetscObject)mat,"Rows %D Cols %D",mat->rmap->n,mat->cmap->n); 1088a5a9c739SBarry Smith #endif 108905b42c5fSBarry Smith ierr = PetscFree(l->pivots);CHKERRQ(ierr); 10906857c123SSatish Balay if (!l->user_alloc) {ierr = PetscFree(l->v);CHKERRQ(ierr);} 1091606d414cSSatish Balay ierr = PetscFree(l);CHKERRQ(ierr); 1092dbd8c25aSHong Zhang 1093dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)mat,0);CHKERRQ(ierr); 1094901853e0SKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)mat,"MatSeqDenseSetPreallocation_C","",PETSC_NULL);CHKERRQ(ierr); 10954ae313f4SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)mat,"MatMatMult_seqaij_seqdense_C","",PETSC_NULL);CHKERRQ(ierr); 10964ae313f4SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)mat,"MatMatMultSymbolic_seqaij_seqdense_C","",PETSC_NULL);CHKERRQ(ierr); 10974ae313f4SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)mat,"MatMatMultNumeric_seqaij_seqdense_C","",PETSC_NULL);CHKERRQ(ierr); 10983a40ed3dSBarry Smith PetscFunctionReturn(0); 1099289bc588SBarry Smith } 1100289bc588SBarry Smith 11014a2ae208SSatish Balay #undef __FUNCT__ 11024a2ae208SSatish Balay #define __FUNCT__ "MatTranspose_SeqDense" 1103fc4dec0aSBarry Smith PetscErrorCode MatTranspose_SeqDense(Mat A,MatReuse reuse,Mat *matout) 1104289bc588SBarry Smith { 1105c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 11066849ba73SBarry Smith PetscErrorCode ierr; 110713f74950SBarry Smith PetscInt k,j,m,n,M; 110887828ca2SBarry Smith PetscScalar *v,tmp; 110948b35521SBarry Smith 11103a40ed3dSBarry Smith PetscFunctionBegin; 1111d0f46423SBarry Smith v = mat->v; m = A->rmap->n; M = mat->lda; n = A->cmap->n; 1112e9695a30SBarry Smith if (reuse == MAT_REUSE_MATRIX && *matout == A) { /* in place transpose */ 1113e7e72b3dSBarry Smith if (m != n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Can not transpose non-square matrix in place"); 1114e7e72b3dSBarry Smith else { 1115d3e5ee88SLois Curfman McInnes for (j=0; j<m; j++) { 1116289bc588SBarry Smith for (k=0; k<j; k++) { 11171b807ce4Svictorle tmp = v[j + k*M]; 11181b807ce4Svictorle v[j + k*M] = v[k + j*M]; 11191b807ce4Svictorle v[k + j*M] = tmp; 1120289bc588SBarry Smith } 1121289bc588SBarry Smith } 1122d64ed03dSBarry Smith } 11233a40ed3dSBarry Smith } else { /* out-of-place transpose */ 1124d3e5ee88SLois Curfman McInnes Mat tmat; 1125ec8511deSBarry Smith Mat_SeqDense *tmatd; 112687828ca2SBarry Smith PetscScalar *v2; 1127ea709b57SSatish Balay 1128fc4dec0aSBarry Smith if (reuse == MAT_INITIAL_MATRIX) { 11297adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&tmat);CHKERRQ(ierr); 1130d0f46423SBarry Smith ierr = MatSetSizes(tmat,A->cmap->n,A->rmap->n,A->cmap->n,A->rmap->n);CHKERRQ(ierr); 11317adad957SLisandro Dalcin ierr = MatSetType(tmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 11325c5985e7SKris Buschelman ierr = MatSeqDenseSetPreallocation(tmat,PETSC_NULL);CHKERRQ(ierr); 1133fc4dec0aSBarry Smith } else { 1134fc4dec0aSBarry Smith tmat = *matout; 1135fc4dec0aSBarry Smith } 1136ec8511deSBarry Smith tmatd = (Mat_SeqDense*)tmat->data; 11370de55854SLois Curfman McInnes v = mat->v; v2 = tmatd->v; 1138d3e5ee88SLois Curfman McInnes for (j=0; j<n; j++) { 11391b807ce4Svictorle for (k=0; k<m; k++) v2[j + k*n] = v[k + j*M]; 1140d3e5ee88SLois Curfman McInnes } 11416d4a8577SBarry Smith ierr = MatAssemblyBegin(tmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 11426d4a8577SBarry Smith ierr = MatAssemblyEnd(tmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1143d3e5ee88SLois Curfman McInnes *matout = tmat; 114448b35521SBarry Smith } 11453a40ed3dSBarry Smith PetscFunctionReturn(0); 1146289bc588SBarry Smith } 1147289bc588SBarry Smith 11484a2ae208SSatish Balay #undef __FUNCT__ 11494a2ae208SSatish Balay #define __FUNCT__ "MatEqual_SeqDense" 1150ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqDense(Mat A1,Mat A2,PetscBool *flg) 1151289bc588SBarry Smith { 1152c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat1 = (Mat_SeqDense*)A1->data; 1153c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat2 = (Mat_SeqDense*)A2->data; 115413f74950SBarry Smith PetscInt i,j; 115587828ca2SBarry Smith PetscScalar *v1 = mat1->v,*v2 = mat2->v; 11569ea5d5aeSSatish Balay 11573a40ed3dSBarry Smith PetscFunctionBegin; 1158d0f46423SBarry Smith if (A1->rmap->n != A2->rmap->n) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 1159d0f46423SBarry Smith if (A1->cmap->n != A2->cmap->n) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 1160d0f46423SBarry Smith for (i=0; i<A1->rmap->n; i++) { 11611b807ce4Svictorle v1 = mat1->v+i; v2 = mat2->v+i; 1162d0f46423SBarry Smith for (j=0; j<A1->cmap->n; j++) { 11633a40ed3dSBarry Smith if (*v1 != *v2) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 11641b807ce4Svictorle v1 += mat1->lda; v2 += mat2->lda; 11651b807ce4Svictorle } 1166289bc588SBarry Smith } 116777c4ece6SBarry Smith *flg = PETSC_TRUE; 11683a40ed3dSBarry Smith PetscFunctionReturn(0); 1169289bc588SBarry Smith } 1170289bc588SBarry Smith 11714a2ae208SSatish Balay #undef __FUNCT__ 11724a2ae208SSatish Balay #define __FUNCT__ "MatGetDiagonal_SeqDense" 1173dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqDense(Mat A,Vec v) 1174289bc588SBarry Smith { 1175c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1176dfbe8321SBarry Smith PetscErrorCode ierr; 117713f74950SBarry Smith PetscInt i,n,len; 117887828ca2SBarry Smith PetscScalar *x,zero = 0.0; 117944cd7ae7SLois Curfman McInnes 11803a40ed3dSBarry Smith PetscFunctionBegin; 11812dcb1b2aSMatthew Knepley ierr = VecSet(v,zero);CHKERRQ(ierr); 11827a97a34bSBarry Smith ierr = VecGetSize(v,&n);CHKERRQ(ierr); 11831ebc52fbSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1184d0f46423SBarry Smith len = PetscMin(A->rmap->n,A->cmap->n); 1185e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming mat and vec"); 118644cd7ae7SLois Curfman McInnes for (i=0; i<len; i++) { 11871b807ce4Svictorle x[i] = mat->v[i*mat->lda + i]; 1188289bc588SBarry Smith } 11891ebc52fbSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 11903a40ed3dSBarry Smith PetscFunctionReturn(0); 1191289bc588SBarry Smith } 1192289bc588SBarry Smith 11934a2ae208SSatish Balay #undef __FUNCT__ 11944a2ae208SSatish Balay #define __FUNCT__ "MatDiagonalScale_SeqDense" 1195dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqDense(Mat A,Vec ll,Vec rr) 1196289bc588SBarry Smith { 1197c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 119887828ca2SBarry Smith PetscScalar *l,*r,x,*v; 1199dfbe8321SBarry Smith PetscErrorCode ierr; 1200d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n; 120155659b69SBarry Smith 12023a40ed3dSBarry Smith PetscFunctionBegin; 120328988994SBarry Smith if (ll) { 12047a97a34bSBarry Smith ierr = VecGetSize(ll,&m);CHKERRQ(ierr); 12051ebc52fbSHong Zhang ierr = VecGetArray(ll,&l);CHKERRQ(ierr); 1206e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vec wrong size"); 1207da3a660dSBarry Smith for (i=0; i<m; i++) { 1208da3a660dSBarry Smith x = l[i]; 1209da3a660dSBarry Smith v = mat->v + i; 1210da3a660dSBarry Smith for (j=0; j<n; j++) { (*v) *= x; v+= m;} 1211da3a660dSBarry Smith } 12121ebc52fbSHong Zhang ierr = VecRestoreArray(ll,&l);CHKERRQ(ierr); 1213efee365bSSatish Balay ierr = PetscLogFlops(n*m);CHKERRQ(ierr); 1214da3a660dSBarry Smith } 121528988994SBarry Smith if (rr) { 12167a97a34bSBarry Smith ierr = VecGetSize(rr,&n);CHKERRQ(ierr); 12171ebc52fbSHong Zhang ierr = VecGetArray(rr,&r);CHKERRQ(ierr); 1218e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vec wrong size"); 1219da3a660dSBarry Smith for (i=0; i<n; i++) { 1220da3a660dSBarry Smith x = r[i]; 1221da3a660dSBarry Smith v = mat->v + i*m; 1222da3a660dSBarry Smith for (j=0; j<m; j++) { (*v++) *= x;} 1223da3a660dSBarry Smith } 12241ebc52fbSHong Zhang ierr = VecRestoreArray(rr,&r);CHKERRQ(ierr); 1225efee365bSSatish Balay ierr = PetscLogFlops(n*m);CHKERRQ(ierr); 1226da3a660dSBarry Smith } 12273a40ed3dSBarry Smith PetscFunctionReturn(0); 1228289bc588SBarry Smith } 1229289bc588SBarry Smith 12304a2ae208SSatish Balay #undef __FUNCT__ 12314a2ae208SSatish Balay #define __FUNCT__ "MatNorm_SeqDense" 1232dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqDense(Mat A,NormType type,PetscReal *nrm) 1233289bc588SBarry Smith { 1234c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 123587828ca2SBarry Smith PetscScalar *v = mat->v; 1236329f5518SBarry Smith PetscReal sum = 0.0; 1237d0f46423SBarry Smith PetscInt lda=mat->lda,m=A->rmap->n,i,j; 1238efee365bSSatish Balay PetscErrorCode ierr; 123955659b69SBarry Smith 12403a40ed3dSBarry Smith PetscFunctionBegin; 1241289bc588SBarry Smith if (type == NORM_FROBENIUS) { 1242a5ce6ee0Svictorle if (lda>m) { 1243d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1244a5ce6ee0Svictorle v = mat->v+j*lda; 1245a5ce6ee0Svictorle for (i=0; i<m; i++) { 1246a5ce6ee0Svictorle #if defined(PETSC_USE_COMPLEX) 1247a5ce6ee0Svictorle sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 1248a5ce6ee0Svictorle #else 1249a5ce6ee0Svictorle sum += (*v)*(*v); v++; 1250a5ce6ee0Svictorle #endif 1251a5ce6ee0Svictorle } 1252a5ce6ee0Svictorle } 1253a5ce6ee0Svictorle } else { 1254d0f46423SBarry Smith for (i=0; i<A->cmap->n*A->rmap->n; i++) { 1255aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 1256329f5518SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 1257289bc588SBarry Smith #else 1258289bc588SBarry Smith sum += (*v)*(*v); v++; 1259289bc588SBarry Smith #endif 1260289bc588SBarry Smith } 1261a5ce6ee0Svictorle } 1262064f8208SBarry Smith *nrm = sqrt(sum); 1263dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 12643a40ed3dSBarry Smith } else if (type == NORM_1) { 1265064f8208SBarry Smith *nrm = 0.0; 1266d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 12671b807ce4Svictorle v = mat->v + j*mat->lda; 1268289bc588SBarry Smith sum = 0.0; 1269d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 127033a8263dSBarry Smith sum += PetscAbsScalar(*v); v++; 1271289bc588SBarry Smith } 1272064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 1273289bc588SBarry Smith } 1274d0f46423SBarry Smith ierr = PetscLogFlops(A->cmap->n*A->rmap->n);CHKERRQ(ierr); 12753a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 1276064f8208SBarry Smith *nrm = 0.0; 1277d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 1278289bc588SBarry Smith v = mat->v + j; 1279289bc588SBarry Smith sum = 0.0; 1280d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) { 12811b807ce4Svictorle sum += PetscAbsScalar(*v); v += mat->lda; 1282289bc588SBarry Smith } 1283064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 1284289bc588SBarry Smith } 1285d0f46423SBarry Smith ierr = PetscLogFlops(A->cmap->n*A->rmap->n);CHKERRQ(ierr); 1286e7e72b3dSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No two norm"); 12873a40ed3dSBarry Smith PetscFunctionReturn(0); 1288289bc588SBarry Smith } 1289289bc588SBarry Smith 12904a2ae208SSatish Balay #undef __FUNCT__ 12914a2ae208SSatish Balay #define __FUNCT__ "MatSetOption_SeqDense" 1292ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqDense(Mat A,MatOption op,PetscBool flg) 1293289bc588SBarry Smith { 1294c0bbcb79SLois Curfman McInnes Mat_SeqDense *aij = (Mat_SeqDense*)A->data; 129563ba0a88SBarry Smith PetscErrorCode ierr; 129667e560aaSBarry Smith 12973a40ed3dSBarry Smith PetscFunctionBegin; 1298b5a2b587SKris Buschelman switch (op) { 1299b5a2b587SKris Buschelman case MAT_ROW_ORIENTED: 13004e0d8c25SBarry Smith aij->roworiented = flg; 1301b5a2b587SKris Buschelman break; 1302512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1303b5a2b587SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 13043971808eSMatthew Knepley case MAT_NEW_NONZERO_ALLOCATION_ERR: 13054e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 1306b5a2b587SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1307b5a2b587SKris Buschelman case MAT_USE_HASH_TABLE: 130877e54ba9SKris Buschelman case MAT_SYMMETRIC: 130977e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 13109a4540c5SBarry Smith case MAT_HERMITIAN: 13119a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 1312600fe468SBarry Smith case MAT_IGNORE_LOWER_TRIANGULAR: 1313290bbb0aSBarry Smith ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 131477e54ba9SKris Buschelman break; 1315b5a2b587SKris Buschelman default: 1316e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %s",MatOptions[op]); 13173a40ed3dSBarry Smith } 13183a40ed3dSBarry Smith PetscFunctionReturn(0); 1319289bc588SBarry Smith } 1320289bc588SBarry Smith 13214a2ae208SSatish Balay #undef __FUNCT__ 13224a2ae208SSatish Balay #define __FUNCT__ "MatZeroEntries_SeqDense" 1323dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqDense(Mat A) 13246f0a148fSBarry Smith { 1325ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)A->data; 13266849ba73SBarry Smith PetscErrorCode ierr; 1327d0f46423SBarry Smith PetscInt lda=l->lda,m=A->rmap->n,j; 13283a40ed3dSBarry Smith 13293a40ed3dSBarry Smith PetscFunctionBegin; 1330a5ce6ee0Svictorle if (lda>m) { 1331d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1332a5ce6ee0Svictorle ierr = PetscMemzero(l->v+j*lda,m*sizeof(PetscScalar));CHKERRQ(ierr); 1333a5ce6ee0Svictorle } 1334a5ce6ee0Svictorle } else { 1335d0f46423SBarry Smith ierr = PetscMemzero(l->v,A->rmap->n*A->cmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 1336a5ce6ee0Svictorle } 13373a40ed3dSBarry Smith PetscFunctionReturn(0); 13386f0a148fSBarry Smith } 13396f0a148fSBarry Smith 13404a2ae208SSatish Balay #undef __FUNCT__ 13414a2ae208SSatish Balay #define __FUNCT__ "MatZeroRows_SeqDense" 13422b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqDense(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 13436f0a148fSBarry Smith { 1344*97b48c8fSBarry Smith PetscErrorCode ierr; 1345ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)A->data; 1346d0f46423SBarry Smith PetscInt n = A->cmap->n,i,j; 1347*97b48c8fSBarry Smith PetscScalar *slot,*bb; 1348*97b48c8fSBarry Smith const PetscScalar *xx; 134955659b69SBarry Smith 13503a40ed3dSBarry Smith PetscFunctionBegin; 1351*97b48c8fSBarry Smith /* fix right hand side if needed */ 1352*97b48c8fSBarry Smith if (x && b) { 1353*97b48c8fSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 1354*97b48c8fSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 1355*97b48c8fSBarry Smith for (i=0; i<N; i++) { 1356*97b48c8fSBarry Smith bb[rows[i]] = diag*xx[rows[i]]; 1357*97b48c8fSBarry Smith } 1358*97b48c8fSBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 1359*97b48c8fSBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 1360*97b48c8fSBarry Smith } 1361*97b48c8fSBarry Smith 13626f0a148fSBarry Smith for (i=0; i<N; i++) { 13636f0a148fSBarry Smith slot = l->v + rows[i]; 13646f0a148fSBarry Smith for (j=0; j<n; j++) { *slot = 0.0; slot += n;} 13656f0a148fSBarry Smith } 1366f4df32b1SMatthew Knepley if (diag != 0.0) { 13676f0a148fSBarry Smith for (i=0; i<N; i++) { 13686f0a148fSBarry Smith slot = l->v + (n+1)*rows[i]; 1369f4df32b1SMatthew Knepley *slot = diag; 13706f0a148fSBarry Smith } 13716f0a148fSBarry Smith } 13723a40ed3dSBarry Smith PetscFunctionReturn(0); 13736f0a148fSBarry Smith } 1374557bce09SLois Curfman McInnes 13754a2ae208SSatish Balay #undef __FUNCT__ 13764a2ae208SSatish Balay #define __FUNCT__ "MatGetArray_SeqDense" 1377dfbe8321SBarry Smith PetscErrorCode MatGetArray_SeqDense(Mat A,PetscScalar *array[]) 137864e87e97SBarry Smith { 1379c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 13803a40ed3dSBarry Smith 13813a40ed3dSBarry Smith PetscFunctionBegin; 1382e32f2f54SBarry Smith if (mat->lda != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot get array for Dense matrices with LDA different from number of rows"); 138364e87e97SBarry Smith *array = mat->v; 13843a40ed3dSBarry Smith PetscFunctionReturn(0); 138564e87e97SBarry Smith } 13860754003eSLois Curfman McInnes 13874a2ae208SSatish Balay #undef __FUNCT__ 13884a2ae208SSatish Balay #define __FUNCT__ "MatRestoreArray_SeqDense" 1389dfbe8321SBarry Smith PetscErrorCode MatRestoreArray_SeqDense(Mat A,PetscScalar *array[]) 1390ff14e315SSatish Balay { 13913a40ed3dSBarry Smith PetscFunctionBegin; 139209b544d4SBarry Smith *array = 0; /* user cannot accidently use the array later */ 13933a40ed3dSBarry Smith PetscFunctionReturn(0); 1394ff14e315SSatish Balay } 13950754003eSLois Curfman McInnes 13964a2ae208SSatish Balay #undef __FUNCT__ 13974a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrix_SeqDense" 139813f74950SBarry Smith static PetscErrorCode MatGetSubMatrix_SeqDense(Mat A,IS isrow,IS iscol,PetscInt cs,MatReuse scall,Mat *B) 13990754003eSLois Curfman McInnes { 1400c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 14016849ba73SBarry Smith PetscErrorCode ierr; 14025d0c19d7SBarry Smith PetscInt i,j,nrows,ncols; 14035d0c19d7SBarry Smith const PetscInt *irow,*icol; 140487828ca2SBarry Smith PetscScalar *av,*bv,*v = mat->v; 14050754003eSLois Curfman McInnes Mat newmat; 14060754003eSLois Curfman McInnes 14073a40ed3dSBarry Smith PetscFunctionBegin; 140878b31e54SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 140978b31e54SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 1410e03a110bSBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 1411e03a110bSBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 14120754003eSLois Curfman McInnes 1413182d2002SSatish Balay /* Check submatrixcall */ 1414182d2002SSatish Balay if (scall == MAT_REUSE_MATRIX) { 141513f74950SBarry Smith PetscInt n_cols,n_rows; 1416182d2002SSatish Balay ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 141721a2c019SBarry Smith if (n_rows != nrows || n_cols != ncols) { 141821a2c019SBarry Smith /* resize the result result matrix to match number of requested rows/columns */ 1419c61587bbSBarry Smith ierr = MatSetSizes(*B,nrows,ncols,nrows,ncols);CHKERRQ(ierr); 142021a2c019SBarry Smith } 1421182d2002SSatish Balay newmat = *B; 1422182d2002SSatish Balay } else { 14230754003eSLois Curfman McInnes /* Create and fill new matrix */ 14247adad957SLisandro Dalcin ierr = MatCreate(((PetscObject)A)->comm,&newmat);CHKERRQ(ierr); 1425f69a0ea3SMatthew Knepley ierr = MatSetSizes(newmat,nrows,ncols,nrows,ncols);CHKERRQ(ierr); 14267adad957SLisandro Dalcin ierr = MatSetType(newmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 14275c5985e7SKris Buschelman ierr = MatSeqDenseSetPreallocation(newmat,PETSC_NULL);CHKERRQ(ierr); 1428182d2002SSatish Balay } 1429182d2002SSatish Balay 1430182d2002SSatish Balay /* Now extract the data pointers and do the copy,column at a time */ 1431182d2002SSatish Balay bv = ((Mat_SeqDense*)newmat->data)->v; 1432182d2002SSatish Balay 1433182d2002SSatish Balay for (i=0; i<ncols; i++) { 14346de62eeeSBarry Smith av = v + mat->lda*icol[i]; 1435182d2002SSatish Balay for (j=0; j<nrows; j++) { 1436182d2002SSatish Balay *bv++ = av[irow[j]]; 14370754003eSLois Curfman McInnes } 14380754003eSLois Curfman McInnes } 1439182d2002SSatish Balay 1440182d2002SSatish Balay /* Assemble the matrices so that the correct flags are set */ 14416d4a8577SBarry Smith ierr = MatAssemblyBegin(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14426d4a8577SBarry Smith ierr = MatAssemblyEnd(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14430754003eSLois Curfman McInnes 14440754003eSLois Curfman McInnes /* Free work space */ 144578b31e54SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 144678b31e54SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 1447182d2002SSatish Balay *B = newmat; 14483a40ed3dSBarry Smith PetscFunctionReturn(0); 14490754003eSLois Curfman McInnes } 14500754003eSLois Curfman McInnes 14514a2ae208SSatish Balay #undef __FUNCT__ 14524a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrices_SeqDense" 145313f74950SBarry Smith PetscErrorCode MatGetSubMatrices_SeqDense(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 1454905e6a2fSBarry Smith { 14556849ba73SBarry Smith PetscErrorCode ierr; 145613f74950SBarry Smith PetscInt i; 1457905e6a2fSBarry Smith 14583a40ed3dSBarry Smith PetscFunctionBegin; 1459905e6a2fSBarry Smith if (scall == MAT_INITIAL_MATRIX) { 1460b0a32e0cSBarry Smith ierr = PetscMalloc((n+1)*sizeof(Mat),B);CHKERRQ(ierr); 1461905e6a2fSBarry Smith } 1462905e6a2fSBarry Smith 1463905e6a2fSBarry Smith for (i=0; i<n; i++) { 14646a6a5d1dSBarry Smith ierr = MatGetSubMatrix_SeqDense(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 1465905e6a2fSBarry Smith } 14663a40ed3dSBarry Smith PetscFunctionReturn(0); 1467905e6a2fSBarry Smith } 1468905e6a2fSBarry Smith 14694a2ae208SSatish Balay #undef __FUNCT__ 1470c0aa2d19SHong Zhang #define __FUNCT__ "MatAssemblyBegin_SeqDense" 1471c0aa2d19SHong Zhang PetscErrorCode MatAssemblyBegin_SeqDense(Mat mat,MatAssemblyType mode) 1472c0aa2d19SHong Zhang { 1473c0aa2d19SHong Zhang PetscFunctionBegin; 1474c0aa2d19SHong Zhang PetscFunctionReturn(0); 1475c0aa2d19SHong Zhang } 1476c0aa2d19SHong Zhang 1477c0aa2d19SHong Zhang #undef __FUNCT__ 1478c0aa2d19SHong Zhang #define __FUNCT__ "MatAssemblyEnd_SeqDense" 1479c0aa2d19SHong Zhang PetscErrorCode MatAssemblyEnd_SeqDense(Mat mat,MatAssemblyType mode) 1480c0aa2d19SHong Zhang { 1481c0aa2d19SHong Zhang PetscFunctionBegin; 1482c0aa2d19SHong Zhang PetscFunctionReturn(0); 1483c0aa2d19SHong Zhang } 1484c0aa2d19SHong Zhang 1485c0aa2d19SHong Zhang #undef __FUNCT__ 14864a2ae208SSatish Balay #define __FUNCT__ "MatCopy_SeqDense" 1487dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqDense(Mat A,Mat B,MatStructure str) 14884b0e389bSBarry Smith { 14894b0e389bSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data,*b = (Mat_SeqDense *)B->data; 14906849ba73SBarry Smith PetscErrorCode ierr; 1491d0f46423SBarry Smith PetscInt lda1=a->lda,lda2=b->lda, m=A->rmap->n,n=A->cmap->n, j; 14923a40ed3dSBarry Smith 14933a40ed3dSBarry Smith PetscFunctionBegin; 149433f4a19fSKris Buschelman /* If the two matrices don't have the same copy implementation, they aren't compatible for fast copy. */ 149533f4a19fSKris Buschelman if (A->ops->copy != B->ops->copy) { 1496cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 14973a40ed3dSBarry Smith PetscFunctionReturn(0); 14983a40ed3dSBarry Smith } 1499e32f2f54SBarry Smith if (m != B->rmap->n || n != B->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"size(B) != size(A)"); 1500a5ce6ee0Svictorle if (lda1>m || lda2>m) { 15010dbb7854Svictorle for (j=0; j<n; j++) { 1502a5ce6ee0Svictorle ierr = PetscMemcpy(b->v+j*lda2,a->v+j*lda1,m*sizeof(PetscScalar));CHKERRQ(ierr); 1503a5ce6ee0Svictorle } 1504a5ce6ee0Svictorle } else { 1505d0f46423SBarry Smith ierr = PetscMemcpy(b->v,a->v,A->rmap->n*A->cmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 1506a5ce6ee0Svictorle } 1507273d9f13SBarry Smith PetscFunctionReturn(0); 1508273d9f13SBarry Smith } 1509273d9f13SBarry Smith 15104a2ae208SSatish Balay #undef __FUNCT__ 15114a2ae208SSatish Balay #define __FUNCT__ "MatSetUpPreallocation_SeqDense" 1512dfbe8321SBarry Smith PetscErrorCode MatSetUpPreallocation_SeqDense(Mat A) 1513273d9f13SBarry Smith { 1514dfbe8321SBarry Smith PetscErrorCode ierr; 1515273d9f13SBarry Smith 1516273d9f13SBarry Smith PetscFunctionBegin; 1517273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(A,0);CHKERRQ(ierr); 15183a40ed3dSBarry Smith PetscFunctionReturn(0); 15194b0e389bSBarry Smith } 15204b0e389bSBarry Smith 1521284134d9SBarry Smith #undef __FUNCT__ 1522284134d9SBarry Smith #define __FUNCT__ "MatSetSizes_SeqDense" 1523284134d9SBarry Smith PetscErrorCode MatSetSizes_SeqDense(Mat A,PetscInt m,PetscInt n,PetscInt M,PetscInt N) 1524284134d9SBarry Smith { 1525284134d9SBarry Smith PetscFunctionBegin; 152621a2c019SBarry Smith /* this will not be called before lda, Mmax, and Nmax have been set */ 1527284134d9SBarry Smith m = PetscMax(m,M); 1528284134d9SBarry Smith n = PetscMax(n,N); 1529a868139aSShri Abhyankar 153086d161a7SShri Abhyankar /* if (m > a->Mmax) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot yet resize number rows of dense matrix larger then its initial size %d, requested %d",a->lda,(int)m); 153186d161a7SShri Abhyankar if (n > a->Nmax) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot yet resize number columns of dense matrix larger then its initial size %d, requested %d",a->Nmax,(int)n); 153286d161a7SShri Abhyankar */ 1533dc5cefdeSJed Brown A->rmap->n = A->rmap->N = m; 1534d0f46423SBarry Smith A->cmap->n = A->cmap->N = n; 1535284134d9SBarry Smith PetscFunctionReturn(0); 1536284134d9SBarry Smith } 1537170fe5c8SBarry Smith 1538ba337c44SJed Brown #undef __FUNCT__ 1539ba337c44SJed Brown #define __FUNCT__ "MatConjugate_SeqDense" 1540ba337c44SJed Brown static PetscErrorCode MatConjugate_SeqDense(Mat A) 1541ba337c44SJed Brown { 1542ba337c44SJed Brown Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1543ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 1544ba337c44SJed Brown PetscScalar *aa = a->v; 1545ba337c44SJed Brown 1546ba337c44SJed Brown PetscFunctionBegin; 1547ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscConj(aa[i]); 1548ba337c44SJed Brown PetscFunctionReturn(0); 1549ba337c44SJed Brown } 1550ba337c44SJed Brown 1551ba337c44SJed Brown #undef __FUNCT__ 1552ba337c44SJed Brown #define __FUNCT__ "MatRealPart_SeqDense" 1553ba337c44SJed Brown static PetscErrorCode MatRealPart_SeqDense(Mat A) 1554ba337c44SJed Brown { 1555ba337c44SJed Brown Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1556ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 1557ba337c44SJed Brown PetscScalar *aa = a->v; 1558ba337c44SJed Brown 1559ba337c44SJed Brown PetscFunctionBegin; 1560ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 1561ba337c44SJed Brown PetscFunctionReturn(0); 1562ba337c44SJed Brown } 1563ba337c44SJed Brown 1564ba337c44SJed Brown #undef __FUNCT__ 1565ba337c44SJed Brown #define __FUNCT__ "MatImaginaryPart_SeqDense" 1566ba337c44SJed Brown static PetscErrorCode MatImaginaryPart_SeqDense(Mat A) 1567ba337c44SJed Brown { 1568ba337c44SJed Brown Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1569ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 1570ba337c44SJed Brown PetscScalar *aa = a->v; 1571ba337c44SJed Brown 1572ba337c44SJed Brown PetscFunctionBegin; 1573ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 1574ba337c44SJed Brown PetscFunctionReturn(0); 1575ba337c44SJed Brown } 1576284134d9SBarry Smith 1577a9fe9ddaSSatish Balay /* ----------------------------------------------------------------*/ 1578a9fe9ddaSSatish Balay #undef __FUNCT__ 1579a9fe9ddaSSatish Balay #define __FUNCT__ "MatMatMult_SeqDense_SeqDense" 1580a9fe9ddaSSatish Balay PetscErrorCode MatMatMult_SeqDense_SeqDense(Mat A,Mat B,MatReuse scall,PetscReal fill,Mat *C) 1581a9fe9ddaSSatish Balay { 1582a9fe9ddaSSatish Balay PetscErrorCode ierr; 1583a9fe9ddaSSatish Balay 1584a9fe9ddaSSatish Balay PetscFunctionBegin; 1585a9fe9ddaSSatish Balay if (scall == MAT_INITIAL_MATRIX){ 1586a9fe9ddaSSatish Balay ierr = MatMatMultSymbolic_SeqDense_SeqDense(A,B,fill,C);CHKERRQ(ierr); 1587a9fe9ddaSSatish Balay } 1588a9fe9ddaSSatish Balay ierr = MatMatMultNumeric_SeqDense_SeqDense(A,B,*C);CHKERRQ(ierr); 1589a9fe9ddaSSatish Balay PetscFunctionReturn(0); 1590a9fe9ddaSSatish Balay } 1591a9fe9ddaSSatish Balay 1592a9fe9ddaSSatish Balay #undef __FUNCT__ 1593a9fe9ddaSSatish Balay #define __FUNCT__ "MatMatMultSymbolic_SeqDense_SeqDense" 1594a9fe9ddaSSatish Balay PetscErrorCode MatMatMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat *C) 1595a9fe9ddaSSatish Balay { 1596ee16a9a1SHong Zhang PetscErrorCode ierr; 1597d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 1598ee16a9a1SHong Zhang Mat Cmat; 1599a9fe9ddaSSatish Balay 1600ee16a9a1SHong Zhang PetscFunctionBegin; 1601e32f2f54SBarry Smith if (A->cmap->n != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %d != B->rmap->n %d\n",A->cmap->n,B->rmap->n); 1602ee16a9a1SHong Zhang ierr = MatCreate(PETSC_COMM_SELF,&Cmat);CHKERRQ(ierr); 1603ee16a9a1SHong Zhang ierr = MatSetSizes(Cmat,m,n,m,n);CHKERRQ(ierr); 1604ee16a9a1SHong Zhang ierr = MatSetType(Cmat,MATSEQDENSE);CHKERRQ(ierr); 1605ee16a9a1SHong Zhang ierr = MatSeqDenseSetPreallocation(Cmat,PETSC_NULL);CHKERRQ(ierr); 1606ee16a9a1SHong Zhang Cmat->assembled = PETSC_TRUE; 1607ee16a9a1SHong Zhang *C = Cmat; 1608ee16a9a1SHong Zhang PetscFunctionReturn(0); 1609ee16a9a1SHong Zhang } 1610a9fe9ddaSSatish Balay 161198a3b096SSatish Balay #undef __FUNCT__ 1612a9fe9ddaSSatish Balay #define __FUNCT__ "MatMatMultNumeric_SeqDense_SeqDense" 1613a9fe9ddaSSatish Balay PetscErrorCode MatMatMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 1614a9fe9ddaSSatish Balay { 1615a9fe9ddaSSatish Balay Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1616a9fe9ddaSSatish Balay Mat_SeqDense *b = (Mat_SeqDense*)B->data; 1617a9fe9ddaSSatish Balay Mat_SeqDense *c = (Mat_SeqDense*)C->data; 16180805154bSBarry Smith PetscBLASInt m,n,k; 1619a9fe9ddaSSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 1620a9fe9ddaSSatish Balay 1621a9fe9ddaSSatish Balay PetscFunctionBegin; 1622d0f46423SBarry Smith m = PetscBLASIntCast(A->rmap->n); 1623d0f46423SBarry Smith n = PetscBLASIntCast(B->cmap->n); 1624d0f46423SBarry Smith k = PetscBLASIntCast(A->cmap->n); 1625a9fe9ddaSSatish Balay BLASgemm_("N","N",&m,&n,&k,&_DOne,a->v,&a->lda,b->v,&b->lda,&_DZero,c->v,&c->lda); 1626a9fe9ddaSSatish Balay PetscFunctionReturn(0); 1627a9fe9ddaSSatish Balay } 1628a9fe9ddaSSatish Balay 1629a9fe9ddaSSatish Balay #undef __FUNCT__ 1630a9fe9ddaSSatish Balay #define __FUNCT__ "MatMatMultTranspose_SeqDense_SeqDense" 1631a9fe9ddaSSatish Balay PetscErrorCode MatMatMultTranspose_SeqDense_SeqDense(Mat A,Mat B,MatReuse scall,PetscReal fill,Mat *C) 1632a9fe9ddaSSatish Balay { 1633a9fe9ddaSSatish Balay PetscErrorCode ierr; 1634a9fe9ddaSSatish Balay 1635a9fe9ddaSSatish Balay PetscFunctionBegin; 1636a9fe9ddaSSatish Balay if (scall == MAT_INITIAL_MATRIX){ 1637a9fe9ddaSSatish Balay ierr = MatMatMultTransposeSymbolic_SeqDense_SeqDense(A,B,fill,C);CHKERRQ(ierr); 1638a9fe9ddaSSatish Balay } 1639a9fe9ddaSSatish Balay ierr = MatMatMultTransposeNumeric_SeqDense_SeqDense(A,B,*C);CHKERRQ(ierr); 1640a9fe9ddaSSatish Balay PetscFunctionReturn(0); 1641a9fe9ddaSSatish Balay } 1642a9fe9ddaSSatish Balay 1643a9fe9ddaSSatish Balay #undef __FUNCT__ 1644a9fe9ddaSSatish Balay #define __FUNCT__ "MatMatMultTransposeSymbolic_SeqDense_SeqDense" 1645a9fe9ddaSSatish Balay PetscErrorCode MatMatMultTransposeSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat *C) 1646a9fe9ddaSSatish Balay { 1647ee16a9a1SHong Zhang PetscErrorCode ierr; 1648d0f46423SBarry Smith PetscInt m=A->cmap->n,n=B->cmap->n; 1649ee16a9a1SHong Zhang Mat Cmat; 1650a9fe9ddaSSatish Balay 1651ee16a9a1SHong Zhang PetscFunctionBegin; 1652e32f2f54SBarry Smith if (A->rmap->n != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->rmap->n %d != B->rmap->n %d\n",A->rmap->n,B->rmap->n); 1653ee16a9a1SHong Zhang ierr = MatCreate(PETSC_COMM_SELF,&Cmat);CHKERRQ(ierr); 1654ee16a9a1SHong Zhang ierr = MatSetSizes(Cmat,m,n,m,n);CHKERRQ(ierr); 1655ee16a9a1SHong Zhang ierr = MatSetType(Cmat,MATSEQDENSE);CHKERRQ(ierr); 1656ee16a9a1SHong Zhang ierr = MatSeqDenseSetPreallocation(Cmat,PETSC_NULL);CHKERRQ(ierr); 1657ee16a9a1SHong Zhang Cmat->assembled = PETSC_TRUE; 1658ee16a9a1SHong Zhang *C = Cmat; 1659ee16a9a1SHong Zhang PetscFunctionReturn(0); 1660ee16a9a1SHong Zhang } 1661a9fe9ddaSSatish Balay 1662a9fe9ddaSSatish Balay #undef __FUNCT__ 1663a9fe9ddaSSatish Balay #define __FUNCT__ "MatMatMultTransposeNumeric_SeqDense_SeqDense" 1664a9fe9ddaSSatish Balay PetscErrorCode MatMatMultTransposeNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 1665a9fe9ddaSSatish Balay { 1666a9fe9ddaSSatish Balay Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1667a9fe9ddaSSatish Balay Mat_SeqDense *b = (Mat_SeqDense*)B->data; 1668a9fe9ddaSSatish Balay Mat_SeqDense *c = (Mat_SeqDense*)C->data; 16690805154bSBarry Smith PetscBLASInt m,n,k; 1670a9fe9ddaSSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 1671a9fe9ddaSSatish Balay 1672a9fe9ddaSSatish Balay PetscFunctionBegin; 1673d0f46423SBarry Smith m = PetscBLASIntCast(A->cmap->n); 1674d0f46423SBarry Smith n = PetscBLASIntCast(B->cmap->n); 1675d0f46423SBarry Smith k = PetscBLASIntCast(A->rmap->n); 16762fbe02b9SBarry Smith /* 16772fbe02b9SBarry Smith Note the m and n arguments below are the number rows and columns of A', not A! 16782fbe02b9SBarry Smith */ 1679a9fe9ddaSSatish Balay BLASgemm_("T","N",&m,&n,&k,&_DOne,a->v,&a->lda,b->v,&b->lda,&_DZero,c->v,&c->lda); 1680a9fe9ddaSSatish Balay PetscFunctionReturn(0); 1681a9fe9ddaSSatish Balay } 1682985db425SBarry Smith 1683985db425SBarry Smith #undef __FUNCT__ 1684985db425SBarry Smith #define __FUNCT__ "MatGetRowMax_SeqDense" 1685985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqDense(Mat A,Vec v,PetscInt idx[]) 1686985db425SBarry Smith { 1687985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1688985db425SBarry Smith PetscErrorCode ierr; 1689d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 1690985db425SBarry Smith PetscScalar *x; 1691985db425SBarry Smith MatScalar *aa = a->v; 1692985db425SBarry Smith 1693985db425SBarry Smith PetscFunctionBegin; 1694e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 1695985db425SBarry Smith 1696985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 1697985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1698985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 1699e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 1700985db425SBarry Smith for (i=0; i<m; i++) { 1701985db425SBarry Smith x[i] = aa[i]; if (idx) idx[i] = 0; 1702985db425SBarry Smith for (j=1; j<n; j++){ 1703985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(aa[i+m*j])) {x[i] = aa[i + m*j]; if (idx) idx[i] = j;} 1704985db425SBarry Smith } 1705985db425SBarry Smith } 1706985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 1707985db425SBarry Smith PetscFunctionReturn(0); 1708985db425SBarry Smith } 1709985db425SBarry Smith 1710985db425SBarry Smith #undef __FUNCT__ 1711985db425SBarry Smith #define __FUNCT__ "MatGetRowMaxAbs_SeqDense" 1712985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqDense(Mat A,Vec v,PetscInt idx[]) 1713985db425SBarry Smith { 1714985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1715985db425SBarry Smith PetscErrorCode ierr; 1716d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 1717985db425SBarry Smith PetscScalar *x; 1718985db425SBarry Smith PetscReal atmp; 1719985db425SBarry Smith MatScalar *aa = a->v; 1720985db425SBarry Smith 1721985db425SBarry Smith PetscFunctionBegin; 1722e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 1723985db425SBarry Smith 1724985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 1725985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1726985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 1727e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 1728985db425SBarry Smith for (i=0; i<m; i++) { 17299189402eSHong Zhang x[i] = PetscAbsScalar(aa[i]); 1730985db425SBarry Smith for (j=1; j<n; j++){ 1731985db425SBarry Smith atmp = PetscAbsScalar(aa[i+m*j]); 1732985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = j;} 1733985db425SBarry Smith } 1734985db425SBarry Smith } 1735985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 1736985db425SBarry Smith PetscFunctionReturn(0); 1737985db425SBarry Smith } 1738985db425SBarry Smith 1739985db425SBarry Smith #undef __FUNCT__ 1740985db425SBarry Smith #define __FUNCT__ "MatGetRowMin_SeqDense" 1741985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqDense(Mat A,Vec v,PetscInt idx[]) 1742985db425SBarry Smith { 1743985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1744985db425SBarry Smith PetscErrorCode ierr; 1745d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 1746985db425SBarry Smith PetscScalar *x; 1747985db425SBarry Smith MatScalar *aa = a->v; 1748985db425SBarry Smith 1749985db425SBarry Smith PetscFunctionBegin; 1750e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 1751985db425SBarry Smith 1752985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 1753985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1754985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 1755e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 1756985db425SBarry Smith for (i=0; i<m; i++) { 1757985db425SBarry Smith x[i] = aa[i]; if (idx) idx[i] = 0; 1758985db425SBarry Smith for (j=1; j<n; j++){ 1759985db425SBarry Smith if (PetscRealPart(x[i]) > PetscRealPart(aa[i+m*j])) {x[i] = aa[i + m*j]; if (idx) idx[i] = j;} 1760985db425SBarry Smith } 1761985db425SBarry Smith } 1762985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 1763985db425SBarry Smith PetscFunctionReturn(0); 1764985db425SBarry Smith } 1765985db425SBarry Smith 17668d0534beSBarry Smith #undef __FUNCT__ 17678d0534beSBarry Smith #define __FUNCT__ "MatGetColumnVector_SeqDense" 17688d0534beSBarry Smith PetscErrorCode MatGetColumnVector_SeqDense(Mat A,Vec v,PetscInt col) 17698d0534beSBarry Smith { 17708d0534beSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 17718d0534beSBarry Smith PetscErrorCode ierr; 17728d0534beSBarry Smith PetscScalar *x; 17738d0534beSBarry Smith 17748d0534beSBarry Smith PetscFunctionBegin; 1775e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 17768d0534beSBarry Smith 17778d0534beSBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1778d0f46423SBarry Smith ierr = PetscMemcpy(x,a->v+col*a->lda,A->rmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 17798d0534beSBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 17808d0534beSBarry Smith PetscFunctionReturn(0); 17818d0534beSBarry Smith } 17828d0534beSBarry Smith 1783289bc588SBarry Smith /* -------------------------------------------------------------------*/ 1784a5ae1ecdSBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqDense, 1785905e6a2fSBarry Smith MatGetRow_SeqDense, 1786905e6a2fSBarry Smith MatRestoreRow_SeqDense, 1787905e6a2fSBarry Smith MatMult_SeqDense, 178897304618SKris Buschelman /* 4*/ MatMultAdd_SeqDense, 17897c922b88SBarry Smith MatMultTranspose_SeqDense, 17907c922b88SBarry Smith MatMultTransposeAdd_SeqDense, 1791db4efbfdSBarry Smith 0, 1792db4efbfdSBarry Smith 0, 1793db4efbfdSBarry Smith 0, 1794db4efbfdSBarry Smith /*10*/ 0, 1795905e6a2fSBarry Smith MatLUFactor_SeqDense, 1796905e6a2fSBarry Smith MatCholeskyFactor_SeqDense, 179741f059aeSBarry Smith MatSOR_SeqDense, 1798ec8511deSBarry Smith MatTranspose_SeqDense, 179997304618SKris Buschelman /*15*/ MatGetInfo_SeqDense, 1800905e6a2fSBarry Smith MatEqual_SeqDense, 1801905e6a2fSBarry Smith MatGetDiagonal_SeqDense, 1802905e6a2fSBarry Smith MatDiagonalScale_SeqDense, 1803905e6a2fSBarry Smith MatNorm_SeqDense, 1804c0aa2d19SHong Zhang /*20*/ MatAssemblyBegin_SeqDense, 1805c0aa2d19SHong Zhang MatAssemblyEnd_SeqDense, 1806905e6a2fSBarry Smith MatSetOption_SeqDense, 1807905e6a2fSBarry Smith MatZeroEntries_SeqDense, 1808d519adbfSMatthew Knepley /*24*/ MatZeroRows_SeqDense, 1809db4efbfdSBarry Smith 0, 1810db4efbfdSBarry Smith 0, 1811db4efbfdSBarry Smith 0, 1812db4efbfdSBarry Smith 0, 1813d519adbfSMatthew Knepley /*29*/ MatSetUpPreallocation_SeqDense, 1814273d9f13SBarry Smith 0, 1815905e6a2fSBarry Smith 0, 1816905e6a2fSBarry Smith MatGetArray_SeqDense, 1817905e6a2fSBarry Smith MatRestoreArray_SeqDense, 1818d519adbfSMatthew Knepley /*34*/ MatDuplicate_SeqDense, 1819a5ae1ecdSBarry Smith 0, 1820a5ae1ecdSBarry Smith 0, 1821a5ae1ecdSBarry Smith 0, 1822a5ae1ecdSBarry Smith 0, 1823d519adbfSMatthew Knepley /*39*/ MatAXPY_SeqDense, 1824a5ae1ecdSBarry Smith MatGetSubMatrices_SeqDense, 1825a5ae1ecdSBarry Smith 0, 18264b0e389bSBarry Smith MatGetValues_SeqDense, 1827a5ae1ecdSBarry Smith MatCopy_SeqDense, 1828d519adbfSMatthew Knepley /*44*/ MatGetRowMax_SeqDense, 1829a5ae1ecdSBarry Smith MatScale_SeqDense, 1830a5ae1ecdSBarry Smith 0, 1831a5ae1ecdSBarry Smith 0, 1832a5ae1ecdSBarry Smith 0, 1833d519adbfSMatthew Knepley /*49*/ 0, 1834a5ae1ecdSBarry Smith 0, 1835a5ae1ecdSBarry Smith 0, 1836a5ae1ecdSBarry Smith 0, 1837a5ae1ecdSBarry Smith 0, 1838d519adbfSMatthew Knepley /*54*/ 0, 1839a5ae1ecdSBarry Smith 0, 1840a5ae1ecdSBarry Smith 0, 1841a5ae1ecdSBarry Smith 0, 1842a5ae1ecdSBarry Smith 0, 1843d519adbfSMatthew Knepley /*59*/ 0, 1844e03a110bSBarry Smith MatDestroy_SeqDense, 1845e03a110bSBarry Smith MatView_SeqDense, 1846357abbc8SBarry Smith 0, 184797304618SKris Buschelman 0, 1848d519adbfSMatthew Knepley /*64*/ 0, 184997304618SKris Buschelman 0, 185097304618SKris Buschelman 0, 185197304618SKris Buschelman 0, 185297304618SKris Buschelman 0, 1853d519adbfSMatthew Knepley /*69*/ MatGetRowMaxAbs_SeqDense, 185497304618SKris Buschelman 0, 185597304618SKris Buschelman 0, 185697304618SKris Buschelman 0, 185797304618SKris Buschelman 0, 1858d519adbfSMatthew Knepley /*74*/ 0, 185997304618SKris Buschelman 0, 186097304618SKris Buschelman 0, 186197304618SKris Buschelman 0, 186297304618SKris Buschelman 0, 1863d519adbfSMatthew Knepley /*79*/ 0, 186497304618SKris Buschelman 0, 186597304618SKris Buschelman 0, 186697304618SKris Buschelman 0, 18675bba2384SShri Abhyankar /*83*/ MatLoad_SeqDense, 1868865e5f61SKris Buschelman 0, 18691cbb95d3SBarry Smith MatIsHermitian_SeqDense, 1870865e5f61SKris Buschelman 0, 1871865e5f61SKris Buschelman 0, 1872865e5f61SKris Buschelman 0, 1873d519adbfSMatthew Knepley /*89*/ MatMatMult_SeqDense_SeqDense, 1874a9fe9ddaSSatish Balay MatMatMultSymbolic_SeqDense_SeqDense, 1875a9fe9ddaSSatish Balay MatMatMultNumeric_SeqDense_SeqDense, 1876865e5f61SKris Buschelman 0, 1877865e5f61SKris Buschelman 0, 1878d519adbfSMatthew Knepley /*94*/ 0, 1879a9fe9ddaSSatish Balay MatMatMultTranspose_SeqDense_SeqDense, 1880a9fe9ddaSSatish Balay MatMatMultTransposeSymbolic_SeqDense_SeqDense, 1881a9fe9ddaSSatish Balay MatMatMultTransposeNumeric_SeqDense_SeqDense, 1882284134d9SBarry Smith 0, 1883d519adbfSMatthew Knepley /*99*/ 0, 1884284134d9SBarry Smith 0, 1885284134d9SBarry Smith 0, 1886ba337c44SJed Brown MatConjugate_SeqDense, 1887985db425SBarry Smith MatSetSizes_SeqDense, 1888ba337c44SJed Brown /*104*/0, 1889ba337c44SJed Brown MatRealPart_SeqDense, 1890ba337c44SJed Brown MatImaginaryPart_SeqDense, 1891985db425SBarry Smith 0, 1892985db425SBarry Smith 0, 1893d519adbfSMatthew Knepley /*109*/0, 1894985db425SBarry Smith 0, 18958d0534beSBarry Smith MatGetRowMin_SeqDense, 1896aabbc4fbSShri Abhyankar MatGetColumnVector_SeqDense, 1897aabbc4fbSShri Abhyankar 0, 1898aabbc4fbSShri Abhyankar /*114*/0, 1899aabbc4fbSShri Abhyankar 0, 1900aabbc4fbSShri Abhyankar 0, 1901aabbc4fbSShri Abhyankar 0, 1902aabbc4fbSShri Abhyankar 0, 1903aabbc4fbSShri Abhyankar /*119*/0, 1904aabbc4fbSShri Abhyankar 0, 1905aabbc4fbSShri Abhyankar 0, 19065bba2384SShri Abhyankar 0 1907985db425SBarry Smith }; 190890ace30eSBarry Smith 19094a2ae208SSatish Balay #undef __FUNCT__ 19104a2ae208SSatish Balay #define __FUNCT__ "MatCreateSeqDense" 19114b828684SBarry Smith /*@C 1912fafbff53SBarry Smith MatCreateSeqDense - Creates a sequential dense matrix that 1913d65003e9SLois Curfman McInnes is stored in column major order (the usual Fortran 77 manner). Many 1914d65003e9SLois Curfman McInnes of the matrix operations use the BLAS and LAPACK routines. 1915289bc588SBarry Smith 1916db81eaa0SLois Curfman McInnes Collective on MPI_Comm 1917db81eaa0SLois Curfman McInnes 191820563c6bSBarry Smith Input Parameters: 1919db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 19200c775827SLois Curfman McInnes . m - number of rows 192118f449edSLois Curfman McInnes . n - number of columns 1922c0235b3cSMatthew Knepley - data - optional location of matrix data in column major order. Set data=PETSC_NULL for PETSc 1923dfc5480cSLois Curfman McInnes to control all matrix memory allocation. 192420563c6bSBarry Smith 192520563c6bSBarry Smith Output Parameter: 192644cd7ae7SLois Curfman McInnes . A - the matrix 192720563c6bSBarry Smith 1928b259b22eSLois Curfman McInnes Notes: 192918f449edSLois Curfman McInnes The data input variable is intended primarily for Fortran programmers 193018f449edSLois Curfman McInnes who wish to allocate their own matrix memory space. Most users should 1931b4fd4287SBarry Smith set data=PETSC_NULL. 193218f449edSLois Curfman McInnes 1933027ccd11SLois Curfman McInnes Level: intermediate 1934027ccd11SLois Curfman McInnes 1935dbd7a890SLois Curfman McInnes .keywords: dense, matrix, LAPACK, BLAS 1936d65003e9SLois Curfman McInnes 1937db81eaa0SLois Curfman McInnes .seealso: MatCreate(), MatCreateMPIDense(), MatSetValues() 193820563c6bSBarry Smith @*/ 1939be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatCreateSeqDense(MPI_Comm comm,PetscInt m,PetscInt n,PetscScalar *data,Mat *A) 1940289bc588SBarry Smith { 1941dfbe8321SBarry Smith PetscErrorCode ierr; 19423b2fbd54SBarry Smith 19433a40ed3dSBarry Smith PetscFunctionBegin; 1944f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 1945f69a0ea3SMatthew Knepley ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 1946273d9f13SBarry Smith ierr = MatSetType(*A,MATSEQDENSE);CHKERRQ(ierr); 1947273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(*A,data);CHKERRQ(ierr); 1948273d9f13SBarry Smith PetscFunctionReturn(0); 1949273d9f13SBarry Smith } 1950273d9f13SBarry Smith 19514a2ae208SSatish Balay #undef __FUNCT__ 1952afc30d2aSLisandro Dalcin #define __FUNCT__ "MatSeqDenseSetPreallocation" 1953273d9f13SBarry Smith /*@C 1954273d9f13SBarry Smith MatSeqDenseSetPreallocation - Sets the array used for storing the matrix elements 1955273d9f13SBarry Smith 1956273d9f13SBarry Smith Collective on MPI_Comm 1957273d9f13SBarry Smith 1958273d9f13SBarry Smith Input Parameters: 1959273d9f13SBarry Smith + A - the matrix 1960273d9f13SBarry Smith - data - the array (or PETSC_NULL) 1961273d9f13SBarry Smith 1962273d9f13SBarry Smith Notes: 1963273d9f13SBarry Smith The data input variable is intended primarily for Fortran programmers 1964273d9f13SBarry Smith who wish to allocate their own matrix memory space. Most users should 1965284134d9SBarry Smith need not call this routine. 1966273d9f13SBarry Smith 1967273d9f13SBarry Smith Level: intermediate 1968273d9f13SBarry Smith 1969273d9f13SBarry Smith .keywords: dense, matrix, LAPACK, BLAS 1970273d9f13SBarry Smith 1971867c911aSBarry Smith .seealso: MatCreate(), MatCreateMPIDense(), MatSetValues(), MatSeqDenseSetLDA() 1972867c911aSBarry Smith 1973273d9f13SBarry Smith @*/ 1974be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatSeqDenseSetPreallocation(Mat B,PetscScalar data[]) 1975273d9f13SBarry Smith { 19764ac538c5SBarry Smith PetscErrorCode ierr; 1977a23d5eceSKris Buschelman 1978a23d5eceSKris Buschelman PetscFunctionBegin; 19794ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqDenseSetPreallocation_C",(Mat,PetscScalar[]),(B,data));CHKERRQ(ierr); 1980a23d5eceSKris Buschelman PetscFunctionReturn(0); 1981a23d5eceSKris Buschelman } 1982a23d5eceSKris Buschelman 1983a23d5eceSKris Buschelman EXTERN_C_BEGIN 1984a23d5eceSKris Buschelman #undef __FUNCT__ 1985afc30d2aSLisandro Dalcin #define __FUNCT__ "MatSeqDenseSetPreallocation_SeqDense" 1986be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatSeqDenseSetPreallocation_SeqDense(Mat B,PetscScalar *data) 1987a23d5eceSKris Buschelman { 1988273d9f13SBarry Smith Mat_SeqDense *b; 1989dfbe8321SBarry Smith PetscErrorCode ierr; 1990273d9f13SBarry Smith 1991273d9f13SBarry Smith PetscFunctionBegin; 1992273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 1993a868139aSShri Abhyankar 199434ef9618SShri Abhyankar ierr = PetscLayoutSetBlockSize(B->rmap,1);CHKERRQ(ierr); 199534ef9618SShri Abhyankar ierr = PetscLayoutSetBlockSize(B->cmap,1);CHKERRQ(ierr); 199634ef9618SShri Abhyankar ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 199734ef9618SShri Abhyankar ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 199834ef9618SShri Abhyankar 1999273d9f13SBarry Smith b = (Mat_SeqDense*)B->data; 200086d161a7SShri Abhyankar b->Mmax = B->rmap->n; 200186d161a7SShri Abhyankar b->Nmax = B->cmap->n; 200286d161a7SShri Abhyankar if(b->lda <= 0 || b->changelda) b->lda = B->rmap->n; 200386d161a7SShri Abhyankar 20049e8f95c4SLisandro Dalcin if (!data) { /* petsc-allocated storage */ 20059e8f95c4SLisandro Dalcin if (!b->user_alloc) { ierr = PetscFree(b->v);CHKERRQ(ierr); } 20065afd5e0cSBarry Smith ierr = PetscMalloc(b->lda*b->Nmax*sizeof(PetscScalar),&b->v);CHKERRQ(ierr); 2007284134d9SBarry Smith ierr = PetscMemzero(b->v,b->lda*b->Nmax*sizeof(PetscScalar));CHKERRQ(ierr); 2008284134d9SBarry Smith ierr = PetscLogObjectMemory(B,b->lda*b->Nmax*sizeof(PetscScalar));CHKERRQ(ierr); 20099e8f95c4SLisandro Dalcin b->user_alloc = PETSC_FALSE; 2010273d9f13SBarry Smith } else { /* user-allocated storage */ 20119e8f95c4SLisandro Dalcin if (!b->user_alloc) { ierr = PetscFree(b->v);CHKERRQ(ierr); } 2012273d9f13SBarry Smith b->v = data; 2013273d9f13SBarry Smith b->user_alloc = PETSC_TRUE; 2014273d9f13SBarry Smith } 20150450473dSBarry Smith B->assembled = PETSC_TRUE; 2016273d9f13SBarry Smith PetscFunctionReturn(0); 2017273d9f13SBarry Smith } 2018a23d5eceSKris Buschelman EXTERN_C_END 2019273d9f13SBarry Smith 20201b807ce4Svictorle #undef __FUNCT__ 20211b807ce4Svictorle #define __FUNCT__ "MatSeqDenseSetLDA" 20221b807ce4Svictorle /*@C 20231b807ce4Svictorle MatSeqDenseSetLDA - Declare the leading dimension of the user-provided array 20241b807ce4Svictorle 20251b807ce4Svictorle Input parameter: 20261b807ce4Svictorle + A - the matrix 20271b807ce4Svictorle - lda - the leading dimension 20281b807ce4Svictorle 20291b807ce4Svictorle Notes: 2030867c911aSBarry Smith This routine is to be used in conjunction with MatSeqDenseSetPreallocation(); 20311b807ce4Svictorle it asserts that the preallocation has a leading dimension (the LDA parameter 20321b807ce4Svictorle of Blas and Lapack fame) larger than M, the first dimension of the matrix. 20331b807ce4Svictorle 20341b807ce4Svictorle Level: intermediate 20351b807ce4Svictorle 20361b807ce4Svictorle .keywords: dense, matrix, LAPACK, BLAS 20371b807ce4Svictorle 2038284134d9SBarry Smith .seealso: MatCreate(), MatCreateSeqDense(), MatSeqDenseSetPreallocation(), MatSetMaximumSize() 2039867c911aSBarry Smith 20401b807ce4Svictorle @*/ 2041be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatSeqDenseSetLDA(Mat B,PetscInt lda) 20421b807ce4Svictorle { 20431b807ce4Svictorle Mat_SeqDense *b = (Mat_SeqDense*)B->data; 204421a2c019SBarry Smith 20451b807ce4Svictorle PetscFunctionBegin; 2046e32f2f54SBarry Smith if (lda < B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"LDA %D must be at least matrix dimension %D",lda,B->rmap->n); 20471b807ce4Svictorle b->lda = lda; 204821a2c019SBarry Smith b->changelda = PETSC_FALSE; 204921a2c019SBarry Smith b->Mmax = PetscMax(b->Mmax,lda); 20501b807ce4Svictorle PetscFunctionReturn(0); 20511b807ce4Svictorle } 20521b807ce4Svictorle 20530bad9183SKris Buschelman /*MC 2054fafad747SKris Buschelman MATSEQDENSE - MATSEQDENSE = "seqdense" - A matrix type to be used for sequential dense matrices. 20550bad9183SKris Buschelman 20560bad9183SKris Buschelman Options Database Keys: 20570bad9183SKris Buschelman . -mat_type seqdense - sets the matrix type to "seqdense" during a call to MatSetFromOptions() 20580bad9183SKris Buschelman 20590bad9183SKris Buschelman Level: beginner 20600bad9183SKris Buschelman 206189665df3SBarry Smith .seealso: MatCreateSeqDense() 206289665df3SBarry Smith 20630bad9183SKris Buschelman M*/ 20640bad9183SKris Buschelman 2065273d9f13SBarry Smith EXTERN_C_BEGIN 20664a2ae208SSatish Balay #undef __FUNCT__ 20674a2ae208SSatish Balay #define __FUNCT__ "MatCreate_SeqDense" 2068be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatCreate_SeqDense(Mat B) 2069273d9f13SBarry Smith { 2070273d9f13SBarry Smith Mat_SeqDense *b; 2071dfbe8321SBarry Smith PetscErrorCode ierr; 20727c334f02SBarry Smith PetscMPIInt size; 2073273d9f13SBarry Smith 2074273d9f13SBarry Smith PetscFunctionBegin; 20757adad957SLisandro Dalcin ierr = MPI_Comm_size(((PetscObject)B)->comm,&size);CHKERRQ(ierr); 2076e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Comm must be of size 1"); 207755659b69SBarry Smith 207838f2d2fdSLisandro Dalcin ierr = PetscNewLog(B,Mat_SeqDense,&b);CHKERRQ(ierr); 2079549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 208090f02eecSBarry Smith B->mapping = 0; 208144cd7ae7SLois Curfman McInnes B->data = (void*)b; 208218f449edSLois Curfman McInnes 208344cd7ae7SLois Curfman McInnes b->pivots = 0; 2084273d9f13SBarry Smith b->roworiented = PETSC_TRUE; 2085273d9f13SBarry Smith b->v = 0; 208621a2c019SBarry Smith b->changelda = PETSC_FALSE; 20874e220ebcSLois Curfman McInnes 2088b24902e0SBarry Smith 2089ec1065edSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatGetFactor_petsc_C", 2090b24902e0SBarry Smith "MatGetFactor_seqdense_petsc", 2091b24902e0SBarry Smith MatGetFactor_seqdense_petsc);CHKERRQ(ierr); 2092a23d5eceSKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatSeqDenseSetPreallocation_C", 2093a23d5eceSKris Buschelman "MatSeqDenseSetPreallocation_SeqDense", 2094a23d5eceSKris Buschelman MatSeqDenseSetPreallocation_SeqDense);CHKERRQ(ierr); 20954ae313f4SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMult_seqaij_seqdense_C", 20964ae313f4SHong Zhang "MatMatMult_SeqAIJ_SeqDense", 20974ae313f4SHong Zhang MatMatMult_SeqAIJ_SeqDense);CHKERRQ(ierr); 20984ae313f4SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMultSymbolic_seqaij_seqdense_C", 20994ae313f4SHong Zhang "MatMatMultSymbolic_SeqAIJ_SeqDense", 21004ae313f4SHong Zhang MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 21014ae313f4SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMatMultNumeric_seqaij_seqdense_C", 21024ae313f4SHong Zhang "MatMatMultNumeric_SeqAIJ_SeqDense", 21034ae313f4SHong Zhang MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 210417667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQDENSE);CHKERRQ(ierr); 21053a40ed3dSBarry Smith PetscFunctionReturn(0); 2106289bc588SBarry Smith } 2107273d9f13SBarry Smith EXTERN_C_END 2108