1be1d678aSKris Buschelman 267e560aaSBarry Smith /* 367e560aaSBarry Smith Defines the basic matrix operations for sequential dense. 467e560aaSBarry Smith */ 5289bc588SBarry Smith 6dec5eb66SMatthew G Knepley #include <../src/mat/impls/dense/seq/dense.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8289bc588SBarry Smith 96a63e612SBarry Smith #include <../src/mat/impls/aij/seq/aij.h> 10b2573a8aSBarry Smith 11ca15aa20SStefano Zampini PetscErrorCode MatSeqDenseSymmetrize_Private(Mat A, PetscBool hermitian) 128c178816SStefano Zampini { 138c178816SStefano Zampini Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 148c178816SStefano Zampini PetscInt j, k, n = A->rmap->n; 15ca15aa20SStefano Zampini PetscScalar *v; 16ca15aa20SStefano Zampini PetscErrorCode ierr; 178c178816SStefano Zampini 188c178816SStefano Zampini PetscFunctionBegin; 198c178816SStefano Zampini if (A->rmap->n != A->cmap->n) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot symmetrize a rectangular matrix"); 20ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 218c178816SStefano Zampini if (!hermitian) { 228c178816SStefano Zampini for (k=0;k<n;k++) { 238c178816SStefano Zampini for (j=k;j<n;j++) { 24ca15aa20SStefano Zampini v[j*mat->lda + k] = v[k*mat->lda + j]; 258c178816SStefano Zampini } 268c178816SStefano Zampini } 278c178816SStefano Zampini } else { 288c178816SStefano Zampini for (k=0;k<n;k++) { 298c178816SStefano Zampini for (j=k;j<n;j++) { 30ca15aa20SStefano Zampini v[j*mat->lda + k] = PetscConj(v[k*mat->lda + j]); 318c178816SStefano Zampini } 328c178816SStefano Zampini } 338c178816SStefano Zampini } 34ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 358c178816SStefano Zampini PetscFunctionReturn(0); 368c178816SStefano Zampini } 378c178816SStefano Zampini 3805709791SSatish Balay PETSC_EXTERN PetscErrorCode MatSeqDenseInvertFactors_Private(Mat A) 398c178816SStefano Zampini { 408c178816SStefano Zampini Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 418c178816SStefano Zampini PetscErrorCode ierr; 428c178816SStefano Zampini PetscBLASInt info,n; 438c178816SStefano Zampini 448c178816SStefano Zampini PetscFunctionBegin; 458c178816SStefano Zampini if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 468c178816SStefano Zampini ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 478c178816SStefano Zampini if (A->factortype == MAT_FACTOR_LU) { 488c178816SStefano Zampini if (!mat->pivots) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Pivots not present"); 498c178816SStefano Zampini if (!mat->fwork) { 508c178816SStefano Zampini mat->lfwork = n; 518c178816SStefano Zampini ierr = PetscMalloc1(mat->lfwork,&mat->fwork);CHKERRQ(ierr); 528c178816SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,mat->lfwork*sizeof(PetscBLASInt));CHKERRQ(ierr); 538c178816SStefano Zampini } 5400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 558c178816SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&mat->lfwork,&info)); 5600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 57ca15aa20SStefano Zampini ierr = PetscLogFlops((1.0*A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 588c178816SStefano Zampini } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 598c178816SStefano Zampini if (A->spd) { 6000121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 618c178816SStefano Zampini PetscStackCallBLAS("LAPACKpotri",LAPACKpotri_("L",&n,mat->v,&mat->lda,&info)); 6200121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 638c178816SStefano Zampini ierr = MatSeqDenseSymmetrize_Private(A,PETSC_TRUE);CHKERRQ(ierr); 648c178816SStefano Zampini #if defined(PETSC_USE_COMPLEX) 658c178816SStefano Zampini } else if (A->hermitian) { 668c178816SStefano Zampini if (!mat->pivots) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Pivots not present"); 678c178816SStefano Zampini if (!mat->fwork) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Fwork not present"); 6800121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 698c178816SStefano Zampini PetscStackCallBLAS("LAPACKhetri",LAPACKhetri_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&info)); 7000121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 718c178816SStefano Zampini ierr = MatSeqDenseSymmetrize_Private(A,PETSC_TRUE);CHKERRQ(ierr); 728c178816SStefano Zampini #endif 738c178816SStefano Zampini } else { /* symmetric case */ 748c178816SStefano Zampini if (!mat->pivots) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Pivots not present"); 758c178816SStefano Zampini if (!mat->fwork) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Fwork not present"); 7600121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 778c178816SStefano Zampini PetscStackCallBLAS("LAPACKsytri",LAPACKsytri_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&info)); 7800121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 798c178816SStefano Zampini ierr = MatSeqDenseSymmetrize_Private(A,PETSC_FALSE);CHKERRQ(ierr); 808c178816SStefano Zampini } 818c178816SStefano Zampini if (info) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_CH_ZRPVT,"Bad Inversion: zero pivot in row %D",(PetscInt)info-1); 82ca15aa20SStefano Zampini ierr = PetscLogFlops((1.0*A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 838c178816SStefano Zampini } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 848c178816SStefano Zampini 858c178816SStefano Zampini A->ops->solve = NULL; 868c178816SStefano Zampini A->ops->matsolve = NULL; 878c178816SStefano Zampini A->ops->solvetranspose = NULL; 888c178816SStefano Zampini A->ops->matsolvetranspose = NULL; 898c178816SStefano Zampini A->ops->solveadd = NULL; 908c178816SStefano Zampini A->ops->solvetransposeadd = NULL; 918c178816SStefano Zampini A->factortype = MAT_FACTOR_NONE; 928c178816SStefano Zampini ierr = PetscFree(A->solvertype);CHKERRQ(ierr); 938c178816SStefano Zampini PetscFunctionReturn(0); 948c178816SStefano Zampini } 958c178816SStefano Zampini 963f49a652SStefano Zampini PetscErrorCode MatZeroRowsColumns_SeqDense(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 973f49a652SStefano Zampini { 983f49a652SStefano Zampini PetscErrorCode ierr; 993f49a652SStefano Zampini Mat_SeqDense *l = (Mat_SeqDense*)A->data; 1003f49a652SStefano Zampini PetscInt m = l->lda, n = A->cmap->n,r = A->rmap->n, i,j; 101ca15aa20SStefano Zampini PetscScalar *slot,*bb,*v; 1023f49a652SStefano Zampini const PetscScalar *xx; 1033f49a652SStefano Zampini 1043f49a652SStefano Zampini PetscFunctionBegin; 10576bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 1063f49a652SStefano Zampini for (i=0; i<N; i++) { 1073f49a652SStefano Zampini if (rows[i] < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row requested to be zeroed"); 1083f49a652SStefano Zampini if (rows[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested to be zeroed greater than or equal number of rows %D",rows[i],A->rmap->n); 1093f49a652SStefano Zampini if (rows[i] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Col %D requested to be zeroed greater than or equal number of cols %D",rows[i],A->cmap->n); 1103f49a652SStefano Zampini } 11176bd3646SJed Brown } 112ca15aa20SStefano Zampini if (!N) PetscFunctionReturn(0); 1133f49a652SStefano Zampini 1143f49a652SStefano Zampini /* fix right hand side if needed */ 1153f49a652SStefano Zampini if (x && b) { 1166c4d906cSStefano Zampini Vec xt; 1176c4d906cSStefano Zampini 1186c4d906cSStefano Zampini if (A->rmap->n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only coded for square matrices"); 1196c4d906cSStefano Zampini ierr = VecDuplicate(x,&xt);CHKERRQ(ierr); 1206c4d906cSStefano Zampini ierr = VecCopy(x,xt);CHKERRQ(ierr); 1216c4d906cSStefano Zampini ierr = VecScale(xt,-1.0);CHKERRQ(ierr); 1226c4d906cSStefano Zampini ierr = MatMultAdd(A,xt,b,b);CHKERRQ(ierr); 1236c4d906cSStefano Zampini ierr = VecDestroy(&xt);CHKERRQ(ierr); 1243f49a652SStefano Zampini ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 1253f49a652SStefano Zampini ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 1263f49a652SStefano Zampini for (i=0; i<N; i++) bb[rows[i]] = diag*xx[rows[i]]; 1273f49a652SStefano Zampini ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 1283f49a652SStefano Zampini ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 1293f49a652SStefano Zampini } 1303f49a652SStefano Zampini 131ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 1323f49a652SStefano Zampini for (i=0; i<N; i++) { 133ca15aa20SStefano Zampini slot = v + rows[i]*m; 134580bdb30SBarry Smith ierr = PetscArrayzero(slot,r);CHKERRQ(ierr); 1353f49a652SStefano Zampini } 1363f49a652SStefano Zampini for (i=0; i<N; i++) { 137ca15aa20SStefano Zampini slot = v + rows[i]; 1383f49a652SStefano Zampini for (j=0; j<n; j++) { *slot = 0.0; slot += m;} 1393f49a652SStefano Zampini } 1403f49a652SStefano Zampini if (diag != 0.0) { 1413f49a652SStefano Zampini if (A->rmap->n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only coded for square matrices"); 1423f49a652SStefano Zampini for (i=0; i<N; i++) { 143ca15aa20SStefano Zampini slot = v + (m+1)*rows[i]; 1443f49a652SStefano Zampini *slot = diag; 1453f49a652SStefano Zampini } 1463f49a652SStefano Zampini } 147ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 1483f49a652SStefano Zampini PetscFunctionReturn(0); 1493f49a652SStefano Zampini } 1503f49a652SStefano Zampini 151abc3b08eSStefano Zampini PetscErrorCode MatPtAPNumeric_SeqDense_SeqDense(Mat A,Mat P,Mat C) 152abc3b08eSStefano Zampini { 153abc3b08eSStefano Zampini Mat_SeqDense *c = (Mat_SeqDense*)(C->data); 154abc3b08eSStefano Zampini PetscErrorCode ierr; 155abc3b08eSStefano Zampini 156abc3b08eSStefano Zampini PetscFunctionBegin; 157ca15aa20SStefano Zampini if (c->ptapwork) { 158ca15aa20SStefano Zampini ierr = (*C->ops->matmultnumeric)(A,P,c->ptapwork);CHKERRQ(ierr); 159ca15aa20SStefano Zampini ierr = (*C->ops->transposematmultnumeric)(P,c->ptapwork,C);CHKERRQ(ierr); 1604222ddf1SHong Zhang } else SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_SUP,"Must call MatPtAPSymbolic_SeqDense_SeqDense() first"); 161abc3b08eSStefano Zampini PetscFunctionReturn(0); 162abc3b08eSStefano Zampini } 163abc3b08eSStefano Zampini 1644222ddf1SHong Zhang PetscErrorCode MatPtAPSymbolic_SeqDense_SeqDense(Mat A,Mat P,PetscReal fill,Mat C) 165abc3b08eSStefano Zampini { 166abc3b08eSStefano Zampini Mat_SeqDense *c; 1677a3c3d58SStefano Zampini PetscBool cisdense; 168abc3b08eSStefano Zampini PetscErrorCode ierr; 169abc3b08eSStefano Zampini 170abc3b08eSStefano Zampini PetscFunctionBegin; 1714222ddf1SHong Zhang ierr = MatSetSizes(C,P->cmap->n,P->cmap->n,P->cmap->N,P->cmap->N);CHKERRQ(ierr); 1727a3c3d58SStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 1737a3c3d58SStefano Zampini if (!cisdense) { 1747a3c3d58SStefano Zampini PetscBool flg; 1757a3c3d58SStefano Zampini 1767a3c3d58SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)P,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 1774222ddf1SHong Zhang ierr = MatSetType(C,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 1787a3c3d58SStefano Zampini } 1797a3c3d58SStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 1804222ddf1SHong Zhang c = (Mat_SeqDense*)C->data; 181ca15aa20SStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)A),&c->ptapwork);CHKERRQ(ierr); 182ca15aa20SStefano Zampini ierr = MatSetSizes(c->ptapwork,A->rmap->n,P->cmap->n,A->rmap->N,P->cmap->N);CHKERRQ(ierr); 1837a3c3d58SStefano Zampini ierr = MatSetType(c->ptapwork,((PetscObject)C)->type_name);CHKERRQ(ierr); 1847a3c3d58SStefano Zampini ierr = MatSetUp(c->ptapwork);CHKERRQ(ierr); 185abc3b08eSStefano Zampini PetscFunctionReturn(0); 186abc3b08eSStefano Zampini } 187abc3b08eSStefano Zampini 188cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqDense(Mat A,MatType newtype,MatReuse reuse,Mat *newmat) 189b49cda9fSStefano Zampini { 190a13144ffSStefano Zampini Mat B = NULL; 191b49cda9fSStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 192b49cda9fSStefano Zampini Mat_SeqDense *b; 193b49cda9fSStefano Zampini PetscErrorCode ierr; 194b49cda9fSStefano Zampini PetscInt *ai=a->i,*aj=a->j,m=A->rmap->N,n=A->cmap->N,i; 195b49cda9fSStefano Zampini MatScalar *av=a->a; 196a13144ffSStefano Zampini PetscBool isseqdense; 197b49cda9fSStefano Zampini 198b49cda9fSStefano Zampini PetscFunctionBegin; 199a13144ffSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 200a13144ffSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)*newmat,MATSEQDENSE,&isseqdense);CHKERRQ(ierr); 201a32993e3SJed Brown if (!isseqdense) SETERRQ1(PetscObjectComm((PetscObject)*newmat),PETSC_ERR_USER,"Cannot reuse matrix of type %s",((PetscObject)(*newmat))->type_name); 202a13144ffSStefano Zampini } 203a13144ffSStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 204b49cda9fSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 205b49cda9fSStefano Zampini ierr = MatSetSizes(B,m,n,m,n);CHKERRQ(ierr); 206b49cda9fSStefano Zampini ierr = MatSetType(B,MATSEQDENSE);CHKERRQ(ierr); 207b49cda9fSStefano Zampini ierr = MatSeqDenseSetPreallocation(B,NULL);CHKERRQ(ierr); 208b49cda9fSStefano Zampini b = (Mat_SeqDense*)(B->data); 209a13144ffSStefano Zampini } else { 210a13144ffSStefano Zampini b = (Mat_SeqDense*)((*newmat)->data); 211580bdb30SBarry Smith ierr = PetscArrayzero(b->v,m*n);CHKERRQ(ierr); 212a13144ffSStefano Zampini } 213b49cda9fSStefano Zampini for (i=0; i<m; i++) { 214b49cda9fSStefano Zampini PetscInt j; 215b49cda9fSStefano Zampini for (j=0;j<ai[1]-ai[0];j++) { 216b49cda9fSStefano Zampini b->v[*aj*m+i] = *av; 217b49cda9fSStefano Zampini aj++; 218b49cda9fSStefano Zampini av++; 219b49cda9fSStefano Zampini } 220b49cda9fSStefano Zampini ai++; 221b49cda9fSStefano Zampini } 222b49cda9fSStefano Zampini 223511c6705SHong Zhang if (reuse == MAT_INPLACE_MATRIX) { 224a13144ffSStefano Zampini ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 225a13144ffSStefano Zampini ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 22628be2f97SBarry Smith ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr); 227b49cda9fSStefano Zampini } else { 228a13144ffSStefano Zampini if (B) *newmat = B; 229a13144ffSStefano Zampini ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 230a13144ffSStefano Zampini ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 231b49cda9fSStefano Zampini } 232b49cda9fSStefano Zampini PetscFunctionReturn(0); 233b49cda9fSStefano Zampini } 234b49cda9fSStefano Zampini 235cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqDense_SeqAIJ(Mat A, MatType newtype,MatReuse reuse,Mat *newmat) 2366a63e612SBarry Smith { 2376a63e612SBarry Smith Mat B; 2386a63e612SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2396a63e612SBarry Smith PetscErrorCode ierr; 2409399e1b8SMatthew G. Knepley PetscInt i, j; 2419399e1b8SMatthew G. Knepley PetscInt *rows, *nnz; 2429399e1b8SMatthew G. Knepley MatScalar *aa = a->v, *vals; 2436a63e612SBarry Smith 2446a63e612SBarry Smith PetscFunctionBegin; 245ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 2466a63e612SBarry Smith ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 2476a63e612SBarry Smith ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 2489399e1b8SMatthew G. Knepley ierr = PetscCalloc3(A->rmap->n,&rows,A->rmap->n,&nnz,A->rmap->n,&vals);CHKERRQ(ierr); 2499399e1b8SMatthew G. Knepley for (j=0; j<A->cmap->n; j++) { 2509399e1b8SMatthew G. Knepley for (i=0; i<A->rmap->n; i++) if (aa[i] != 0.0 || i == j) ++nnz[i]; 2516a63e612SBarry Smith aa += a->lda; 2526a63e612SBarry Smith } 2539399e1b8SMatthew G. Knepley ierr = MatSeqAIJSetPreallocation(B,PETSC_DETERMINE,nnz);CHKERRQ(ierr); 2549399e1b8SMatthew G. Knepley aa = a->v; 2559399e1b8SMatthew G. Knepley for (j=0; j<A->cmap->n; j++) { 2569399e1b8SMatthew G. Knepley PetscInt numRows = 0; 2579399e1b8SMatthew G. Knepley for (i=0; i<A->rmap->n; i++) if (aa[i] != 0.0 || i == j) {rows[numRows] = i; vals[numRows++] = aa[i];} 2589399e1b8SMatthew G. Knepley ierr = MatSetValues(B,numRows,rows,1,&j,vals,INSERT_VALUES);CHKERRQ(ierr); 2599399e1b8SMatthew G. Knepley aa += a->lda; 2609399e1b8SMatthew G. Knepley } 2619399e1b8SMatthew G. Knepley ierr = PetscFree3(rows,nnz,vals);CHKERRQ(ierr); 2626a63e612SBarry Smith ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2636a63e612SBarry Smith ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2646a63e612SBarry Smith 265511c6705SHong Zhang if (reuse == MAT_INPLACE_MATRIX) { 26628be2f97SBarry Smith ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr); 2676a63e612SBarry Smith } else { 2686a63e612SBarry Smith *newmat = B; 2696a63e612SBarry Smith } 2706a63e612SBarry Smith PetscFunctionReturn(0); 2716a63e612SBarry Smith } 2726a63e612SBarry Smith 273ca15aa20SStefano Zampini PetscErrorCode MatAXPY_SeqDense(Mat Y,PetscScalar alpha,Mat X,MatStructure str) 2741987afe7SBarry Smith { 2751987afe7SBarry Smith Mat_SeqDense *x = (Mat_SeqDense*)X->data,*y = (Mat_SeqDense*)Y->data; 276ca15aa20SStefano Zampini const PetscScalar *xv; 277ca15aa20SStefano Zampini PetscScalar *yv; 2780805154bSBarry Smith PetscBLASInt N,m,ldax,lday,one = 1; 279efee365bSSatish Balay PetscErrorCode ierr; 2803a40ed3dSBarry Smith 2813a40ed3dSBarry Smith PetscFunctionBegin; 282ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(X,&xv);CHKERRQ(ierr); 283ca15aa20SStefano Zampini ierr = MatDenseGetArray(Y,&yv);CHKERRQ(ierr); 284c5df96a5SBarry Smith ierr = PetscBLASIntCast(X->rmap->n*X->cmap->n,&N);CHKERRQ(ierr); 285c5df96a5SBarry Smith ierr = PetscBLASIntCast(X->rmap->n,&m);CHKERRQ(ierr); 286c5df96a5SBarry Smith ierr = PetscBLASIntCast(x->lda,&ldax);CHKERRQ(ierr); 287c5df96a5SBarry Smith ierr = PetscBLASIntCast(y->lda,&lday);CHKERRQ(ierr); 288a5ce6ee0Svictorle if (ldax>m || lday>m) { 289ca15aa20SStefano Zampini PetscInt j; 290ca15aa20SStefano Zampini 291d0f46423SBarry Smith for (j=0; j<X->cmap->n; j++) { 292ca15aa20SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&m,&alpha,xv+j*ldax,&one,yv+j*lday,&one)); 293a5ce6ee0Svictorle } 294a5ce6ee0Svictorle } else { 295ca15aa20SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&N,&alpha,xv,&one,yv,&one)); 296a5ce6ee0Svictorle } 297ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(X,&xv);CHKERRQ(ierr); 298ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(Y,&yv);CHKERRQ(ierr); 2990450473dSBarry Smith ierr = PetscLogFlops(PetscMax(2*N-1,0));CHKERRQ(ierr); 3003a40ed3dSBarry Smith PetscFunctionReturn(0); 3011987afe7SBarry Smith } 3021987afe7SBarry Smith 303e0877f53SBarry Smith static PetscErrorCode MatGetInfo_SeqDense(Mat A,MatInfoType flag,MatInfo *info) 304289bc588SBarry Smith { 305ca15aa20SStefano Zampini PetscLogDouble N = A->rmap->n*A->cmap->n; 3063a40ed3dSBarry Smith 3073a40ed3dSBarry Smith PetscFunctionBegin; 3084e220ebcSLois Curfman McInnes info->block_size = 1.0; 309ca15aa20SStefano Zampini info->nz_allocated = N; 310ca15aa20SStefano Zampini info->nz_used = N; 311ca15aa20SStefano Zampini info->nz_unneeded = 0; 312ca15aa20SStefano Zampini info->assemblies = A->num_ass; 3134e220ebcSLois Curfman McInnes info->mallocs = 0; 3147adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 3154e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 3164e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 3174e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 3183a40ed3dSBarry Smith PetscFunctionReturn(0); 319289bc588SBarry Smith } 320289bc588SBarry Smith 321637a0070SStefano Zampini PetscErrorCode MatScale_SeqDense(Mat A,PetscScalar alpha) 32280cd9d93SLois Curfman McInnes { 323273d9f13SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 324ca15aa20SStefano Zampini PetscScalar *v; 325efee365bSSatish Balay PetscErrorCode ierr; 326c5df96a5SBarry Smith PetscBLASInt one = 1,j,nz,lda; 32780cd9d93SLois Curfman McInnes 3283a40ed3dSBarry Smith PetscFunctionBegin; 329ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 330c5df96a5SBarry Smith ierr = PetscBLASIntCast(a->lda,&lda);CHKERRQ(ierr); 331d0f46423SBarry Smith if (lda>A->rmap->n) { 332c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&nz);CHKERRQ(ierr); 333d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 334ca15aa20SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&nz,&alpha,v+j*lda,&one)); 335a5ce6ee0Svictorle } 336a5ce6ee0Svictorle } else { 337c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n*A->cmap->n,&nz);CHKERRQ(ierr); 338ca15aa20SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&nz,&alpha,v,&one)); 339a5ce6ee0Svictorle } 340efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 341ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 3423a40ed3dSBarry Smith PetscFunctionReturn(0); 34380cd9d93SLois Curfman McInnes } 34480cd9d93SLois Curfman McInnes 345e0877f53SBarry Smith static PetscErrorCode MatIsHermitian_SeqDense(Mat A,PetscReal rtol,PetscBool *fl) 3461cbb95d3SBarry Smith { 3471cbb95d3SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 348ca15aa20SStefano Zampini PetscInt i,j,m = A->rmap->n,N = a->lda; 349ca15aa20SStefano Zampini const PetscScalar *v; 350ca15aa20SStefano Zampini PetscErrorCode ierr; 3511cbb95d3SBarry Smith 3521cbb95d3SBarry Smith PetscFunctionBegin; 3531cbb95d3SBarry Smith *fl = PETSC_FALSE; 354d0f46423SBarry Smith if (A->rmap->n != A->cmap->n) PetscFunctionReturn(0); 355ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 3561cbb95d3SBarry Smith for (i=0; i<m; i++) { 357ca15aa20SStefano Zampini for (j=i; j<m; j++) { 358637a0070SStefano Zampini if (PetscAbsScalar(v[i+j*N] - PetscConj(v[j+i*N])) > rtol) { 359637a0070SStefano Zampini goto restore; 3601cbb95d3SBarry Smith } 3611cbb95d3SBarry Smith } 362637a0070SStefano Zampini } 3631cbb95d3SBarry Smith *fl = PETSC_TRUE; 364637a0070SStefano Zampini restore: 365637a0070SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 366637a0070SStefano Zampini PetscFunctionReturn(0); 367637a0070SStefano Zampini } 368637a0070SStefano Zampini 369637a0070SStefano Zampini static PetscErrorCode MatIsSymmetric_SeqDense(Mat A,PetscReal rtol,PetscBool *fl) 370637a0070SStefano Zampini { 371637a0070SStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 372637a0070SStefano Zampini PetscInt i,j,m = A->rmap->n,N = a->lda; 373637a0070SStefano Zampini const PetscScalar *v; 374637a0070SStefano Zampini PetscErrorCode ierr; 375637a0070SStefano Zampini 376637a0070SStefano Zampini PetscFunctionBegin; 377637a0070SStefano Zampini *fl = PETSC_FALSE; 378637a0070SStefano Zampini if (A->rmap->n != A->cmap->n) PetscFunctionReturn(0); 379637a0070SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 380637a0070SStefano Zampini for (i=0; i<m; i++) { 381637a0070SStefano Zampini for (j=i; j<m; j++) { 382637a0070SStefano Zampini if (PetscAbsScalar(v[i+j*N] - v[j+i*N]) > rtol) { 383637a0070SStefano Zampini goto restore; 384637a0070SStefano Zampini } 385637a0070SStefano Zampini } 386637a0070SStefano Zampini } 387637a0070SStefano Zampini *fl = PETSC_TRUE; 388637a0070SStefano Zampini restore: 389637a0070SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 3901cbb95d3SBarry Smith PetscFunctionReturn(0); 3911cbb95d3SBarry Smith } 3921cbb95d3SBarry Smith 393ca15aa20SStefano Zampini PetscErrorCode MatDuplicateNoCreate_SeqDense(Mat newi,Mat A,MatDuplicateOption cpvalues) 394b24902e0SBarry Smith { 395ca15aa20SStefano Zampini Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 396b24902e0SBarry Smith PetscErrorCode ierr; 39723fc5dcaSStefano Zampini PetscInt lda = (PetscInt)mat->lda,j,m,nlda = lda; 398b24902e0SBarry Smith 399b24902e0SBarry Smith PetscFunctionBegin; 400aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->rmap,&newi->rmap);CHKERRQ(ierr); 401aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->cmap,&newi->cmap);CHKERRQ(ierr); 40223fc5dcaSStefano Zampini if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { /* propagate LDA */ 40323fc5dcaSStefano Zampini ierr = MatDenseSetLDA(newi,lda);CHKERRQ(ierr); 40423fc5dcaSStefano Zampini } 4050298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(newi,NULL);CHKERRQ(ierr); 406b24902e0SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 407ca15aa20SStefano Zampini const PetscScalar *av; 408ca15aa20SStefano Zampini PetscScalar *v; 409ca15aa20SStefano Zampini 410ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&av);CHKERRQ(ierr); 411ca15aa20SStefano Zampini ierr = MatDenseGetArray(newi,&v);CHKERRQ(ierr); 41223fc5dcaSStefano Zampini ierr = MatDenseGetLDA(newi,&nlda);CHKERRQ(ierr); 413d0f46423SBarry Smith m = A->rmap->n; 41423fc5dcaSStefano Zampini if (lda>m || nlda>m) { 415d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 41623fc5dcaSStefano Zampini ierr = PetscArraycpy(v+j*nlda,av+j*lda,m);CHKERRQ(ierr); 417b24902e0SBarry Smith } 418b24902e0SBarry Smith } else { 419ca15aa20SStefano Zampini ierr = PetscArraycpy(v,av,A->rmap->n*A->cmap->n);CHKERRQ(ierr); 420b24902e0SBarry Smith } 421ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(newi,&v);CHKERRQ(ierr); 422ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&av);CHKERRQ(ierr); 423b24902e0SBarry Smith } 424b24902e0SBarry Smith PetscFunctionReturn(0); 425b24902e0SBarry Smith } 426b24902e0SBarry Smith 427ca15aa20SStefano Zampini PetscErrorCode MatDuplicate_SeqDense(Mat A,MatDuplicateOption cpvalues,Mat *newmat) 42802cad45dSBarry Smith { 4296849ba73SBarry Smith PetscErrorCode ierr; 43002cad45dSBarry Smith 4313a40ed3dSBarry Smith PetscFunctionBegin; 432ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),newmat);CHKERRQ(ierr); 433d0f46423SBarry Smith ierr = MatSetSizes(*newmat,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 4345c9eb25fSBarry Smith ierr = MatSetType(*newmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 435719d5645SBarry Smith ierr = MatDuplicateNoCreate_SeqDense(*newmat,A,cpvalues);CHKERRQ(ierr); 436b24902e0SBarry Smith PetscFunctionReturn(0); 437b24902e0SBarry Smith } 438b24902e0SBarry Smith 439e0877f53SBarry Smith static PetscErrorCode MatLUFactorNumeric_SeqDense(Mat fact,Mat A,const MatFactorInfo *info_dummy) 440289bc588SBarry Smith { 4414482741eSBarry Smith MatFactorInfo info; 442a093e273SMatthew Knepley PetscErrorCode ierr; 4433a40ed3dSBarry Smith 4443a40ed3dSBarry Smith PetscFunctionBegin; 445c3ef05f6SHong Zhang ierr = MatDuplicateNoCreate_SeqDense(fact,A,MAT_COPY_VALUES);CHKERRQ(ierr); 446ca15aa20SStefano Zampini ierr = (*fact->ops->lufactor)(fact,0,0,&info);CHKERRQ(ierr); 4473a40ed3dSBarry Smith PetscFunctionReturn(0); 448289bc588SBarry Smith } 4496ee01492SSatish Balay 450e0877f53SBarry Smith static PetscErrorCode MatSolve_SeqDense(Mat A,Vec xx,Vec yy) 451289bc588SBarry Smith { 452c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 4536849ba73SBarry Smith PetscErrorCode ierr; 454f1ceaac6SMatthew G. Knepley const PetscScalar *x; 455f1ceaac6SMatthew G. Knepley PetscScalar *y; 456c5df96a5SBarry Smith PetscBLASInt one = 1,info,m; 45767e560aaSBarry Smith 4583a40ed3dSBarry Smith PetscFunctionBegin; 459c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 460f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 4611ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 462580bdb30SBarry Smith ierr = PetscArraycpy(y,x,A->rmap->n);CHKERRQ(ierr); 463d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_LU) { 46400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 4658b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_("N",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 46600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 467e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"GETRS - Bad solve"); 468d5f3da31SBarry Smith } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 469a49dc2a2SStefano Zampini if (A->spd) { 47000121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 4718b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info)); 47200121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 473e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 474a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 475a49dc2a2SStefano Zampini } else if (A->hermitian) { 47600121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 477a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrs",LAPACKhetrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 47800121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 479a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"HETRS Bad solve"); 480a49dc2a2SStefano Zampini #endif 481a49dc2a2SStefano Zampini } else { /* symmetric case */ 48200121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 483a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 48400121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 485a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"SYTRS Bad solve"); 486a49dc2a2SStefano Zampini } 4872205254eSKarl Rupp } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 488f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 4891ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 490dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 4913a40ed3dSBarry Smith PetscFunctionReturn(0); 492289bc588SBarry Smith } 4936ee01492SSatish Balay 494e0877f53SBarry Smith static PetscErrorCode MatMatSolve_SeqDense(Mat A,Mat B,Mat X) 49585e2c93fSHong Zhang { 49685e2c93fSHong Zhang Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 49785e2c93fSHong Zhang PetscErrorCode ierr; 4981683a169SBarry Smith const PetscScalar *b; 4991683a169SBarry Smith PetscScalar *x; 500efb80c78SLisandro Dalcin PetscInt n; 501783b601eSJed Brown PetscBLASInt nrhs,info,m; 50285e2c93fSHong Zhang 50385e2c93fSHong Zhang PetscFunctionBegin; 504c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 5050298fd71SBarry Smith ierr = MatGetSize(B,NULL,&n);CHKERRQ(ierr); 506c5df96a5SBarry Smith ierr = PetscBLASIntCast(n,&nrhs);CHKERRQ(ierr); 5071683a169SBarry Smith ierr = MatDenseGetArrayRead(B,&b);CHKERRQ(ierr); 5088c778c55SBarry Smith ierr = MatDenseGetArray(X,&x);CHKERRQ(ierr); 50985e2c93fSHong Zhang 510580bdb30SBarry Smith ierr = PetscArraycpy(x,b,m*nrhs);CHKERRQ(ierr); 51185e2c93fSHong Zhang 51285e2c93fSHong Zhang if (A->factortype == MAT_FACTOR_LU) { 51300121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5148b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_("N",&m,&nrhs,mat->v,&mat->lda,mat->pivots,x,&m,&info)); 51500121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 51685e2c93fSHong Zhang if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"GETRS - Bad solve"); 51785e2c93fSHong Zhang } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 518a49dc2a2SStefano Zampini if (A->spd) { 51900121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5208b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_("L",&m,&nrhs,mat->v,&mat->lda,x,&m,&info)); 52100121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 52285e2c93fSHong Zhang if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 523a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 524a49dc2a2SStefano Zampini } else if (A->hermitian) { 52500121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 526a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrs",LAPACKhetrs_("L",&m,&nrhs,mat->v,&mat->lda,mat->pivots,x,&m,&info)); 52700121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 528a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"HETRS Bad solve"); 529a49dc2a2SStefano Zampini #endif 530a49dc2a2SStefano Zampini } else { /* symmetric case */ 53100121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 532a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_("L",&m,&nrhs,mat->v,&mat->lda,mat->pivots,x,&m,&info)); 53300121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 534a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"SYTRS Bad solve"); 535a49dc2a2SStefano Zampini } 5362205254eSKarl Rupp } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 53785e2c93fSHong Zhang 5381683a169SBarry Smith ierr = MatDenseRestoreArrayRead(B,&b);CHKERRQ(ierr); 5398c778c55SBarry Smith ierr = MatDenseRestoreArray(X,&x);CHKERRQ(ierr); 54085e2c93fSHong Zhang ierr = PetscLogFlops(nrhs*(2.0*m*m - m));CHKERRQ(ierr); 54185e2c93fSHong Zhang PetscFunctionReturn(0); 54285e2c93fSHong Zhang } 54385e2c93fSHong Zhang 54400121966SStefano Zampini static PetscErrorCode MatConjugate_SeqDense(Mat); 54500121966SStefano Zampini 546e0877f53SBarry Smith static PetscErrorCode MatSolveTranspose_SeqDense(Mat A,Vec xx,Vec yy) 547da3a660dSBarry Smith { 548c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 549dfbe8321SBarry Smith PetscErrorCode ierr; 550f1ceaac6SMatthew G. Knepley const PetscScalar *x; 551f1ceaac6SMatthew G. Knepley PetscScalar *y; 552c5df96a5SBarry Smith PetscBLASInt one = 1,info,m; 55367e560aaSBarry Smith 5543a40ed3dSBarry Smith PetscFunctionBegin; 555c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 556f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 5571ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 558580bdb30SBarry Smith ierr = PetscArraycpy(y,x,A->rmap->n);CHKERRQ(ierr); 5598208b9aeSStefano Zampini if (A->factortype == MAT_FACTOR_LU) { 56000121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5618b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_("T",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 56200121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 563e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS - Bad solve"); 5648208b9aeSStefano Zampini } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 565a49dc2a2SStefano Zampini if (A->spd) { 56600121966SStefano Zampini #if defined(PETSC_USE_COMPLEX) 56700121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 56800121966SStefano Zampini #endif 56900121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5708b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info)); 57100121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 57200121966SStefano Zampini #if defined(PETSC_USE_COMPLEX) 57300121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 57400121966SStefano Zampini #endif 575a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 576a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 577a49dc2a2SStefano Zampini } else if (A->hermitian) { 57800121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 57900121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 58000121966SStefano Zampini PetscStackCallBLAS("LAPACKhetrs",LAPACKhetrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 58100121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 58200121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 583ae7cfcebSSatish Balay #endif 584a49dc2a2SStefano Zampini } else { /* symmetric case */ 58500121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 586a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 58700121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 588a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"SYTRS Bad solve"); 589da3a660dSBarry Smith } 590a49dc2a2SStefano Zampini } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 591f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 5921ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 593dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 5943a40ed3dSBarry Smith PetscFunctionReturn(0); 595da3a660dSBarry Smith } 5966ee01492SSatish Balay 597db4efbfdSBarry Smith /* ---------------------------------------------------------------*/ 598db4efbfdSBarry Smith /* COMMENT: I have chosen to hide row permutation in the pivots, 599db4efbfdSBarry Smith rather than put it in the Mat->row slot.*/ 600ca15aa20SStefano Zampini PetscErrorCode MatLUFactor_SeqDense(Mat A,IS row,IS col,const MatFactorInfo *minfo) 601db4efbfdSBarry Smith { 602db4efbfdSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 603db4efbfdSBarry Smith PetscErrorCode ierr; 604db4efbfdSBarry Smith PetscBLASInt n,m,info; 605db4efbfdSBarry Smith 606db4efbfdSBarry Smith PetscFunctionBegin; 607c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 608c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 609db4efbfdSBarry Smith if (!mat->pivots) { 6108208b9aeSStefano Zampini ierr = PetscMalloc1(A->rmap->n,&mat->pivots);CHKERRQ(ierr); 6113bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 612db4efbfdSBarry Smith } 613db4efbfdSBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 6148e57ea43SSatish Balay ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 6158b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrf",LAPACKgetrf_(&m,&n,mat->v,&mat->lda,mat->pivots,&info)); 6168e57ea43SSatish Balay ierr = PetscFPTrapPop();CHKERRQ(ierr); 6178e57ea43SSatish Balay 618e32f2f54SBarry Smith if (info<0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad argument to LU factorization"); 619e32f2f54SBarry Smith if (info>0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Bad LU factorization"); 6208208b9aeSStefano Zampini 621db4efbfdSBarry Smith A->ops->solve = MatSolve_SeqDense; 6228208b9aeSStefano Zampini A->ops->matsolve = MatMatSolve_SeqDense; 623db4efbfdSBarry Smith A->ops->solvetranspose = MatSolveTranspose_SeqDense; 624d5f3da31SBarry Smith A->factortype = MAT_FACTOR_LU; 625db4efbfdSBarry Smith 626f6224b95SHong Zhang ierr = PetscFree(A->solvertype);CHKERRQ(ierr); 627f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&A->solvertype);CHKERRQ(ierr); 628f6224b95SHong Zhang 629dc0b31edSSatish Balay ierr = PetscLogFlops((2.0*A->cmap->n*A->cmap->n*A->cmap->n)/3);CHKERRQ(ierr); 630db4efbfdSBarry Smith PetscFunctionReturn(0); 631db4efbfdSBarry Smith } 632db4efbfdSBarry Smith 633a49dc2a2SStefano Zampini /* Cholesky as L*L^T or L*D*L^T and the symmetric/hermitian complex variants */ 634ca15aa20SStefano Zampini PetscErrorCode MatCholeskyFactor_SeqDense(Mat A,IS perm,const MatFactorInfo *factinfo) 635db4efbfdSBarry Smith { 636db4efbfdSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 637db4efbfdSBarry Smith PetscErrorCode ierr; 638c5df96a5SBarry Smith PetscBLASInt info,n; 639db4efbfdSBarry Smith 640db4efbfdSBarry Smith PetscFunctionBegin; 641c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 642db4efbfdSBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 643a49dc2a2SStefano Zampini if (A->spd) { 64400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 6458b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrf",LAPACKpotrf_("L",&n,mat->v,&mat->lda,&info)); 64600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 647a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 648a49dc2a2SStefano Zampini } else if (A->hermitian) { 649a49dc2a2SStefano Zampini if (!mat->pivots) { 650a49dc2a2SStefano Zampini ierr = PetscMalloc1(A->rmap->n,&mat->pivots);CHKERRQ(ierr); 651a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 652a49dc2a2SStefano Zampini } 653a49dc2a2SStefano Zampini if (!mat->fwork) { 654a49dc2a2SStefano Zampini PetscScalar dummy; 655a49dc2a2SStefano Zampini 656a49dc2a2SStefano Zampini mat->lfwork = -1; 65700121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 658a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrf",LAPACKhetrf_("L",&n,mat->v,&mat->lda,mat->pivots,&dummy,&mat->lfwork,&info)); 65900121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 660a49dc2a2SStefano Zampini mat->lfwork = (PetscInt)PetscRealPart(dummy); 661a49dc2a2SStefano Zampini ierr = PetscMalloc1(mat->lfwork,&mat->fwork);CHKERRQ(ierr); 662a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,mat->lfwork*sizeof(PetscBLASInt));CHKERRQ(ierr); 663a49dc2a2SStefano Zampini } 66400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 665a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrf",LAPACKhetrf_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&mat->lfwork,&info)); 66600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 667a49dc2a2SStefano Zampini #endif 668a49dc2a2SStefano Zampini } else { /* symmetric case */ 669a49dc2a2SStefano Zampini if (!mat->pivots) { 670a49dc2a2SStefano Zampini ierr = PetscMalloc1(A->rmap->n,&mat->pivots);CHKERRQ(ierr); 671a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 672a49dc2a2SStefano Zampini } 673a49dc2a2SStefano Zampini if (!mat->fwork) { 674a49dc2a2SStefano Zampini PetscScalar dummy; 675a49dc2a2SStefano Zampini 676a49dc2a2SStefano Zampini mat->lfwork = -1; 67700121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 678a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_("L",&n,mat->v,&mat->lda,mat->pivots,&dummy,&mat->lfwork,&info)); 67900121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 680a49dc2a2SStefano Zampini mat->lfwork = (PetscInt)PetscRealPart(dummy); 681a49dc2a2SStefano Zampini ierr = PetscMalloc1(mat->lfwork,&mat->fwork);CHKERRQ(ierr); 682a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,mat->lfwork*sizeof(PetscBLASInt));CHKERRQ(ierr); 683a49dc2a2SStefano Zampini } 68400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 685a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&mat->lfwork,&info)); 68600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 687a49dc2a2SStefano Zampini } 688e32f2f54SBarry Smith if (info) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_CH_ZRPVT,"Bad factorization: zero pivot in row %D",(PetscInt)info-1); 6898208b9aeSStefano Zampini 690db4efbfdSBarry Smith A->ops->solve = MatSolve_SeqDense; 6918208b9aeSStefano Zampini A->ops->matsolve = MatMatSolve_SeqDense; 692db4efbfdSBarry Smith A->ops->solvetranspose = MatSolveTranspose_SeqDense; 693d5f3da31SBarry Smith A->factortype = MAT_FACTOR_CHOLESKY; 6942205254eSKarl Rupp 695f6224b95SHong Zhang ierr = PetscFree(A->solvertype);CHKERRQ(ierr); 696f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&A->solvertype);CHKERRQ(ierr); 697f6224b95SHong Zhang 698eb3f19e4SBarry Smith ierr = PetscLogFlops((1.0*A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 699db4efbfdSBarry Smith PetscFunctionReturn(0); 700db4efbfdSBarry Smith } 701db4efbfdSBarry Smith 7020481f469SBarry Smith PetscErrorCode MatCholeskyFactorNumeric_SeqDense(Mat fact,Mat A,const MatFactorInfo *info_dummy) 703db4efbfdSBarry Smith { 704db4efbfdSBarry Smith PetscErrorCode ierr; 705db4efbfdSBarry Smith MatFactorInfo info; 706db4efbfdSBarry Smith 707db4efbfdSBarry Smith PetscFunctionBegin; 708db4efbfdSBarry Smith info.fill = 1.0; 7092205254eSKarl Rupp 710c3ef05f6SHong Zhang ierr = MatDuplicateNoCreate_SeqDense(fact,A,MAT_COPY_VALUES);CHKERRQ(ierr); 711ca15aa20SStefano Zampini ierr = (*fact->ops->choleskyfactor)(fact,0,&info);CHKERRQ(ierr); 712db4efbfdSBarry Smith PetscFunctionReturn(0); 713db4efbfdSBarry Smith } 714db4efbfdSBarry Smith 715ca15aa20SStefano Zampini PetscErrorCode MatCholeskyFactorSymbolic_SeqDense(Mat fact,Mat A,IS row,const MatFactorInfo *info) 716db4efbfdSBarry Smith { 717db4efbfdSBarry Smith PetscFunctionBegin; 718c3ef05f6SHong Zhang fact->assembled = PETSC_TRUE; 7191bbcc794SSatish Balay fact->preallocated = PETSC_TRUE; 720719d5645SBarry Smith fact->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqDense; 721bd443b22SStefano Zampini fact->ops->solve = MatSolve_SeqDense; 722bd443b22SStefano Zampini fact->ops->matsolve = MatMatSolve_SeqDense; 723bd443b22SStefano Zampini fact->ops->solvetranspose = MatSolveTranspose_SeqDense; 724db4efbfdSBarry Smith PetscFunctionReturn(0); 725db4efbfdSBarry Smith } 726db4efbfdSBarry Smith 727ca15aa20SStefano Zampini PetscErrorCode MatLUFactorSymbolic_SeqDense(Mat fact,Mat A,IS row,IS col,const MatFactorInfo *info) 728db4efbfdSBarry Smith { 729db4efbfdSBarry Smith PetscFunctionBegin; 730b66fe19dSMatthew G Knepley fact->preallocated = PETSC_TRUE; 731c3ef05f6SHong Zhang fact->assembled = PETSC_TRUE; 732719d5645SBarry Smith fact->ops->lufactornumeric = MatLUFactorNumeric_SeqDense; 733bd443b22SStefano Zampini fact->ops->solve = MatSolve_SeqDense; 734bd443b22SStefano Zampini fact->ops->matsolve = MatMatSolve_SeqDense; 735bd443b22SStefano Zampini fact->ops->solvetranspose = MatSolveTranspose_SeqDense; 736db4efbfdSBarry Smith PetscFunctionReturn(0); 737db4efbfdSBarry Smith } 738db4efbfdSBarry Smith 739ca15aa20SStefano Zampini /* uses LAPACK */ 740cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatGetFactor_seqdense_petsc(Mat A,MatFactorType ftype,Mat *fact) 741db4efbfdSBarry Smith { 742db4efbfdSBarry Smith PetscErrorCode ierr; 743db4efbfdSBarry Smith 744db4efbfdSBarry Smith PetscFunctionBegin; 745ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),fact);CHKERRQ(ierr); 746db4efbfdSBarry Smith ierr = MatSetSizes(*fact,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 747ca15aa20SStefano Zampini ierr = MatSetType(*fact,MATDENSE);CHKERRQ(ierr); 748db4efbfdSBarry Smith if (ftype == MAT_FACTOR_LU) { 749db4efbfdSBarry Smith (*fact)->ops->lufactorsymbolic = MatLUFactorSymbolic_SeqDense; 750db4efbfdSBarry Smith } else { 751db4efbfdSBarry Smith (*fact)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqDense; 752db4efbfdSBarry Smith } 753d5f3da31SBarry Smith (*fact)->factortype = ftype; 75400c67f3bSHong Zhang 75500c67f3bSHong Zhang ierr = PetscFree((*fact)->solvertype);CHKERRQ(ierr); 75600c67f3bSHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&(*fact)->solvertype);CHKERRQ(ierr); 757db4efbfdSBarry Smith PetscFunctionReturn(0); 758db4efbfdSBarry Smith } 759db4efbfdSBarry Smith 760289bc588SBarry Smith /* ------------------------------------------------------------------*/ 761e0877f53SBarry Smith static PetscErrorCode MatSOR_SeqDense(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal shift,PetscInt its,PetscInt lits,Vec xx) 762289bc588SBarry Smith { 763c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 764d9ca1df4SBarry Smith PetscScalar *x,*v = mat->v,zero = 0.0,xt; 765d9ca1df4SBarry Smith const PetscScalar *b; 766dfbe8321SBarry Smith PetscErrorCode ierr; 767d0f46423SBarry Smith PetscInt m = A->rmap->n,i; 768c5df96a5SBarry Smith PetscBLASInt o = 1,bm; 769289bc588SBarry Smith 7703a40ed3dSBarry Smith PetscFunctionBegin; 771ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 772c70f7ee4SJunchao Zhang if (A->offloadmask == PETSC_OFFLOAD_GPU) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented"); 773ca15aa20SStefano Zampini #endif 774422a814eSBarry Smith if (shift == -1) shift = 0.0; /* negative shift indicates do not error on zero diagonal; this code never zeros on zero diagonal */ 775c5df96a5SBarry Smith ierr = PetscBLASIntCast(m,&bm);CHKERRQ(ierr); 776289bc588SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 7773bffc371SBarry Smith /* this is a hack fix, should have another version without the second BLASdotu */ 7782dcb1b2aSMatthew Knepley ierr = VecSet(xx,zero);CHKERRQ(ierr); 779289bc588SBarry Smith } 7801ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 781d9ca1df4SBarry Smith ierr = VecGetArrayRead(bb,&b);CHKERRQ(ierr); 782b965ef7fSBarry Smith its = its*lits; 783e32f2f54SBarry Smith if (its <= 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Relaxation requires global its %D and local its %D both positive",its,lits); 784289bc588SBarry Smith while (its--) { 785fccaa45eSBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 786289bc588SBarry Smith for (i=0; i<m; i++) { 7873bffc371SBarry Smith PetscStackCallBLAS("BLASdotu",xt = b[i] - BLASdotu_(&bm,v+i,&bm,x,&o)); 78855a1b374SBarry Smith x[i] = (1. - omega)*x[i] + omega*(xt+v[i + i*m]*x[i])/(v[i + i*m]+shift); 789289bc588SBarry Smith } 790289bc588SBarry Smith } 791fccaa45eSBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 792289bc588SBarry Smith for (i=m-1; i>=0; i--) { 7933bffc371SBarry Smith PetscStackCallBLAS("BLASdotu",xt = b[i] - BLASdotu_(&bm,v+i,&bm,x,&o)); 79455a1b374SBarry Smith x[i] = (1. - omega)*x[i] + omega*(xt+v[i + i*m]*x[i])/(v[i + i*m]+shift); 795289bc588SBarry Smith } 796289bc588SBarry Smith } 797289bc588SBarry Smith } 798d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 7991ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 8003a40ed3dSBarry Smith PetscFunctionReturn(0); 801289bc588SBarry Smith } 802289bc588SBarry Smith 803289bc588SBarry Smith /* -----------------------------------------------------------------*/ 804ca15aa20SStefano Zampini PetscErrorCode MatMultTranspose_SeqDense(Mat A,Vec xx,Vec yy) 805289bc588SBarry Smith { 806c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 807d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 808d9ca1df4SBarry Smith PetscScalar *y; 809dfbe8321SBarry Smith PetscErrorCode ierr; 8100805154bSBarry Smith PetscBLASInt m, n,_One=1; 811ea709b57SSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 8123a40ed3dSBarry Smith 8133a40ed3dSBarry Smith PetscFunctionBegin; 814c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 815c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 816d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8172bf066beSStefano Zampini ierr = VecGetArrayWrite(yy,&y);CHKERRQ(ierr); 8185ac36cfcSBarry Smith if (!A->rmap->n || !A->cmap->n) { 8195ac36cfcSBarry Smith PetscBLASInt i; 8205ac36cfcSBarry Smith for (i=0; i<n; i++) y[i] = 0.0; 8215ac36cfcSBarry Smith } else { 8228b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("T",&m,&n,&_DOne,v,&mat->lda,x,&_One,&_DZero,y,&_One)); 8235ac36cfcSBarry Smith ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 8245ac36cfcSBarry Smith } 825d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8262bf066beSStefano Zampini ierr = VecRestoreArrayWrite(yy,&y);CHKERRQ(ierr); 8273a40ed3dSBarry Smith PetscFunctionReturn(0); 828289bc588SBarry Smith } 829800995b7SMatthew Knepley 830ca15aa20SStefano Zampini PetscErrorCode MatMult_SeqDense(Mat A,Vec xx,Vec yy) 831289bc588SBarry Smith { 832c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 833d9ca1df4SBarry Smith PetscScalar *y,_DOne=1.0,_DZero=0.0; 834dfbe8321SBarry Smith PetscErrorCode ierr; 8350805154bSBarry Smith PetscBLASInt m, n, _One=1; 836d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 8373a40ed3dSBarry Smith 8383a40ed3dSBarry Smith PetscFunctionBegin; 839c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 840c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 841d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8422bf066beSStefano Zampini ierr = VecGetArrayWrite(yy,&y);CHKERRQ(ierr); 8435ac36cfcSBarry Smith if (!A->rmap->n || !A->cmap->n) { 8445ac36cfcSBarry Smith PetscBLASInt i; 8455ac36cfcSBarry Smith for (i=0; i<m; i++) y[i] = 0.0; 8465ac36cfcSBarry Smith } else { 8478b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("N",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DZero,y,&_One)); 8485ac36cfcSBarry Smith ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n - A->rmap->n);CHKERRQ(ierr); 8495ac36cfcSBarry Smith } 850d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8512bf066beSStefano Zampini ierr = VecRestoreArrayWrite(yy,&y);CHKERRQ(ierr); 8523a40ed3dSBarry Smith PetscFunctionReturn(0); 853289bc588SBarry Smith } 8546ee01492SSatish Balay 855ca15aa20SStefano Zampini PetscErrorCode MatMultAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 856289bc588SBarry Smith { 857c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 858d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 859d9ca1df4SBarry Smith PetscScalar *y,_DOne=1.0; 860dfbe8321SBarry Smith PetscErrorCode ierr; 8610805154bSBarry Smith PetscBLASInt m, n, _One=1; 8623a40ed3dSBarry Smith 8633a40ed3dSBarry Smith PetscFunctionBegin; 864c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 865c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 866d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 867600d6d0bSBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 868d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8691ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 8708b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("N",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DOne,y,&_One)); 871d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8721ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 873dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n);CHKERRQ(ierr); 8743a40ed3dSBarry Smith PetscFunctionReturn(0); 875289bc588SBarry Smith } 8766ee01492SSatish Balay 877ca15aa20SStefano Zampini PetscErrorCode MatMultTransposeAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 878289bc588SBarry Smith { 879c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 880d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 881d9ca1df4SBarry Smith PetscScalar *y; 882dfbe8321SBarry Smith PetscErrorCode ierr; 8830805154bSBarry Smith PetscBLASInt m, n, _One=1; 88487828ca2SBarry Smith PetscScalar _DOne=1.0; 8853a40ed3dSBarry Smith 8863a40ed3dSBarry Smith PetscFunctionBegin; 887c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 888c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 889d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 890600d6d0bSBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 891d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8921ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 8938b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("T",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DOne,y,&_One)); 894d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8951ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 896dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n);CHKERRQ(ierr); 8973a40ed3dSBarry Smith PetscFunctionReturn(0); 898289bc588SBarry Smith } 899289bc588SBarry Smith 900289bc588SBarry Smith /* -----------------------------------------------------------------*/ 901e0877f53SBarry Smith static PetscErrorCode MatGetRow_SeqDense(Mat A,PetscInt row,PetscInt *ncols,PetscInt **cols,PetscScalar **vals) 902289bc588SBarry Smith { 903c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 9046849ba73SBarry Smith PetscErrorCode ierr; 90513f74950SBarry Smith PetscInt i; 90667e560aaSBarry Smith 9073a40ed3dSBarry Smith PetscFunctionBegin; 908d0f46423SBarry Smith *ncols = A->cmap->n; 909289bc588SBarry Smith if (cols) { 910854ce69bSBarry Smith ierr = PetscMalloc1(A->cmap->n+1,cols);CHKERRQ(ierr); 911d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) (*cols)[i] = i; 912289bc588SBarry Smith } 913289bc588SBarry Smith if (vals) { 914ca15aa20SStefano Zampini const PetscScalar *v; 915ca15aa20SStefano Zampini 916ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 917854ce69bSBarry Smith ierr = PetscMalloc1(A->cmap->n+1,vals);CHKERRQ(ierr); 918ca15aa20SStefano Zampini v += row; 919d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) {(*vals)[i] = *v; v += mat->lda;} 920ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 921289bc588SBarry Smith } 9223a40ed3dSBarry Smith PetscFunctionReturn(0); 923289bc588SBarry Smith } 9246ee01492SSatish Balay 925e0877f53SBarry Smith static PetscErrorCode MatRestoreRow_SeqDense(Mat A,PetscInt row,PetscInt *ncols,PetscInt **cols,PetscScalar **vals) 926289bc588SBarry Smith { 927dfbe8321SBarry Smith PetscErrorCode ierr; 9286e111a19SKarl Rupp 929606d414cSSatish Balay PetscFunctionBegin; 930606d414cSSatish Balay if (cols) {ierr = PetscFree(*cols);CHKERRQ(ierr);} 931606d414cSSatish Balay if (vals) {ierr = PetscFree(*vals);CHKERRQ(ierr); } 9323a40ed3dSBarry Smith PetscFunctionReturn(0); 933289bc588SBarry Smith } 934289bc588SBarry Smith /* ----------------------------------------------------------------*/ 935e0877f53SBarry Smith static PetscErrorCode MatSetValues_SeqDense(Mat A,PetscInt m,const PetscInt indexm[],PetscInt n,const PetscInt indexn[],const PetscScalar v[],InsertMode addv) 936289bc588SBarry Smith { 937c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 938ca15aa20SStefano Zampini PetscScalar *av; 93913f74950SBarry Smith PetscInt i,j,idx=0; 940ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 941c70f7ee4SJunchao Zhang PetscOffloadMask oldf; 942ca15aa20SStefano Zampini #endif 943ca15aa20SStefano Zampini PetscErrorCode ierr; 944d6dfbf8fSBarry Smith 9453a40ed3dSBarry Smith PetscFunctionBegin; 946ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&av);CHKERRQ(ierr); 947289bc588SBarry Smith if (!mat->roworiented) { 948dbb450caSBarry Smith if (addv == INSERT_VALUES) { 949289bc588SBarry Smith for (j=0; j<n; j++) { 950cddbea37SSatish Balay if (indexn[j] < 0) {idx += m; continue;} 951cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexn[j] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 952289bc588SBarry Smith for (i=0; i<m; i++) { 953cddbea37SSatish Balay if (indexm[i] < 0) {idx++; continue;} 954cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexm[i] >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 955ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] = v[idx++]; 956289bc588SBarry Smith } 957289bc588SBarry Smith } 9583a40ed3dSBarry Smith } else { 959289bc588SBarry Smith for (j=0; j<n; j++) { 960cddbea37SSatish Balay if (indexn[j] < 0) {idx += m; continue;} 961cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexn[j] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 962289bc588SBarry Smith for (i=0; i<m; i++) { 963cddbea37SSatish Balay if (indexm[i] < 0) {idx++; continue;} 964cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexm[i] >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 965ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] += v[idx++]; 966289bc588SBarry Smith } 967289bc588SBarry Smith } 968289bc588SBarry Smith } 9693a40ed3dSBarry Smith } else { 970dbb450caSBarry Smith if (addv == INSERT_VALUES) { 971e8d4e0b9SBarry Smith for (i=0; i<m; i++) { 972cddbea37SSatish Balay if (indexm[i] < 0) { idx += n; continue;} 973cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexm[i] >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 974e8d4e0b9SBarry Smith for (j=0; j<n; j++) { 975cddbea37SSatish Balay if (indexn[j] < 0) { idx++; continue;} 976cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexn[j] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 977ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] = v[idx++]; 978e8d4e0b9SBarry Smith } 979e8d4e0b9SBarry Smith } 9803a40ed3dSBarry Smith } else { 981289bc588SBarry Smith for (i=0; i<m; i++) { 982cddbea37SSatish Balay if (indexm[i] < 0) { idx += n; continue;} 983cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexm[i] >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 984289bc588SBarry Smith for (j=0; j<n; j++) { 985cddbea37SSatish Balay if (indexn[j] < 0) { idx++; continue;} 986cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexn[j] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 987ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] += v[idx++]; 988289bc588SBarry Smith } 989289bc588SBarry Smith } 990289bc588SBarry Smith } 991e8d4e0b9SBarry Smith } 992ca15aa20SStefano Zampini /* hack to prevent unneeded copy to the GPU while returning the array */ 993ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 994c70f7ee4SJunchao Zhang oldf = A->offloadmask; 995c70f7ee4SJunchao Zhang A->offloadmask = PETSC_OFFLOAD_GPU; 996ca15aa20SStefano Zampini #endif 997ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&av);CHKERRQ(ierr); 998ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 999c70f7ee4SJunchao Zhang A->offloadmask = (oldf == PETSC_OFFLOAD_UNALLOCATED ? PETSC_OFFLOAD_UNALLOCATED : PETSC_OFFLOAD_CPU); 1000ca15aa20SStefano Zampini #endif 10013a40ed3dSBarry Smith PetscFunctionReturn(0); 1002289bc588SBarry Smith } 1003e8d4e0b9SBarry Smith 1004e0877f53SBarry Smith static PetscErrorCode MatGetValues_SeqDense(Mat A,PetscInt m,const PetscInt indexm[],PetscInt n,const PetscInt indexn[],PetscScalar v[]) 1005ae80bb75SLois Curfman McInnes { 1006ae80bb75SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1007ca15aa20SStefano Zampini const PetscScalar *vv; 100813f74950SBarry Smith PetscInt i,j; 1009ca15aa20SStefano Zampini PetscErrorCode ierr; 1010ae80bb75SLois Curfman McInnes 10113a40ed3dSBarry Smith PetscFunctionBegin; 1012ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&vv);CHKERRQ(ierr); 1013ae80bb75SLois Curfman McInnes /* row-oriented output */ 1014ae80bb75SLois Curfman McInnes for (i=0; i<m; i++) { 101597e567efSBarry Smith if (indexm[i] < 0) {v += n;continue;} 1016e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested larger than number rows %D",indexm[i],A->rmap->n); 1017ae80bb75SLois Curfman McInnes for (j=0; j<n; j++) { 10186f31f424SBarry Smith if (indexn[j] < 0) {v++; continue;} 1019e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column %D requested larger than number columns %D",indexn[j],A->cmap->n); 1020ca15aa20SStefano Zampini *v++ = vv[indexn[j]*mat->lda + indexm[i]]; 1021ae80bb75SLois Curfman McInnes } 1022ae80bb75SLois Curfman McInnes } 1023ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&vv);CHKERRQ(ierr); 10243a40ed3dSBarry Smith PetscFunctionReturn(0); 1025ae80bb75SLois Curfman McInnes } 1026ae80bb75SLois Curfman McInnes 1027289bc588SBarry Smith /* -----------------------------------------------------------------*/ 1028289bc588SBarry Smith 10298491ab44SLisandro Dalcin PetscErrorCode MatView_Dense_Binary(Mat mat,PetscViewer viewer) 1030aabbc4fbSShri Abhyankar { 1031aabbc4fbSShri Abhyankar PetscErrorCode ierr; 10328491ab44SLisandro Dalcin PetscBool skipHeader; 10338491ab44SLisandro Dalcin PetscViewerFormat format; 10348491ab44SLisandro Dalcin PetscInt header[4],M,N,m,lda,i,j,k; 10358491ab44SLisandro Dalcin const PetscScalar *v; 10368491ab44SLisandro Dalcin PetscScalar *vwork; 1037aabbc4fbSShri Abhyankar 1038aabbc4fbSShri Abhyankar PetscFunctionBegin; 10398491ab44SLisandro Dalcin ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 10408491ab44SLisandro Dalcin ierr = PetscViewerBinaryGetSkipHeader(viewer,&skipHeader);CHKERRQ(ierr); 10418491ab44SLisandro Dalcin ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 10428491ab44SLisandro Dalcin if (skipHeader) format = PETSC_VIEWER_NATIVE; 1043aabbc4fbSShri Abhyankar 10448491ab44SLisandro Dalcin ierr = MatGetSize(mat,&M,&N);CHKERRQ(ierr); 10458491ab44SLisandro Dalcin 10468491ab44SLisandro Dalcin /* write matrix header */ 10478491ab44SLisandro Dalcin header[0] = MAT_FILE_CLASSID; header[1] = M; header[2] = N; 10488491ab44SLisandro Dalcin header[3] = (format == PETSC_VIEWER_NATIVE) ? MATRIX_BINARY_FORMAT_DENSE : M*N; 10498491ab44SLisandro Dalcin if (!skipHeader) {ierr = PetscViewerBinaryWrite(viewer,header,4,PETSC_INT);CHKERRQ(ierr);} 10508491ab44SLisandro Dalcin 10518491ab44SLisandro Dalcin ierr = MatGetLocalSize(mat,&m,NULL);CHKERRQ(ierr); 10528491ab44SLisandro Dalcin if (format != PETSC_VIEWER_NATIVE) { 10538491ab44SLisandro Dalcin PetscInt nnz = m*N, *iwork; 10548491ab44SLisandro Dalcin /* store row lengths for each row */ 10558491ab44SLisandro Dalcin ierr = PetscMalloc1(nnz,&iwork);CHKERRQ(ierr); 10568491ab44SLisandro Dalcin for (i=0; i<m; i++) iwork[i] = N; 10578491ab44SLisandro Dalcin ierr = PetscViewerBinaryWriteAll(viewer,iwork,m,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_INT);CHKERRQ(ierr); 10588491ab44SLisandro Dalcin /* store column indices (zero start index) */ 10598491ab44SLisandro Dalcin for (k=0, i=0; i<m; i++) 10608491ab44SLisandro Dalcin for (j=0; j<N; j++, k++) 10618491ab44SLisandro Dalcin iwork[k] = j; 10628491ab44SLisandro Dalcin ierr = PetscViewerBinaryWriteAll(viewer,iwork,nnz,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_INT);CHKERRQ(ierr); 10638491ab44SLisandro Dalcin ierr = PetscFree(iwork);CHKERRQ(ierr); 10648491ab44SLisandro Dalcin } 10658491ab44SLisandro Dalcin /* store matrix values as a dense matrix in row major order */ 10668491ab44SLisandro Dalcin ierr = PetscMalloc1(m*N,&vwork);CHKERRQ(ierr); 10678491ab44SLisandro Dalcin ierr = MatDenseGetArrayRead(mat,&v);CHKERRQ(ierr); 10688491ab44SLisandro Dalcin ierr = MatDenseGetLDA(mat,&lda);CHKERRQ(ierr); 10698491ab44SLisandro Dalcin for (k=0, i=0; i<m; i++) 10708491ab44SLisandro Dalcin for (j=0; j<N; j++, k++) 10718491ab44SLisandro Dalcin vwork[k] = v[i+lda*j]; 10728491ab44SLisandro Dalcin ierr = MatDenseRestoreArrayRead(mat,&v);CHKERRQ(ierr); 10738491ab44SLisandro Dalcin ierr = PetscViewerBinaryWriteAll(viewer,vwork,m*N,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_SCALAR);CHKERRQ(ierr); 10748491ab44SLisandro Dalcin ierr = PetscFree(vwork);CHKERRQ(ierr); 10758491ab44SLisandro Dalcin PetscFunctionReturn(0); 10768491ab44SLisandro Dalcin } 10778491ab44SLisandro Dalcin 10788491ab44SLisandro Dalcin PetscErrorCode MatLoad_Dense_Binary(Mat mat,PetscViewer viewer) 10798491ab44SLisandro Dalcin { 10808491ab44SLisandro Dalcin PetscErrorCode ierr; 10818491ab44SLisandro Dalcin PetscBool skipHeader; 10828491ab44SLisandro Dalcin PetscInt header[4],M,N,m,nz,lda,i,j,k; 10838491ab44SLisandro Dalcin PetscInt rows,cols; 10848491ab44SLisandro Dalcin PetscScalar *v,*vwork; 10858491ab44SLisandro Dalcin 10868491ab44SLisandro Dalcin PetscFunctionBegin; 10878491ab44SLisandro Dalcin ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 10888491ab44SLisandro Dalcin ierr = PetscViewerBinaryGetSkipHeader(viewer,&skipHeader);CHKERRQ(ierr); 10898491ab44SLisandro Dalcin 10908491ab44SLisandro Dalcin if (!skipHeader) { 10918491ab44SLisandro Dalcin ierr = PetscViewerBinaryRead(viewer,header,4,NULL,PETSC_INT);CHKERRQ(ierr); 10928491ab44SLisandro Dalcin if (header[0] != MAT_FILE_CLASSID) SETERRQ(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Not a matrix object in file"); 10938491ab44SLisandro Dalcin M = header[1]; N = header[2]; 10948491ab44SLisandro Dalcin if (M < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix row size (%D) in file is negative",M); 10958491ab44SLisandro Dalcin if (N < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix column size (%D) in file is negative",N); 10968491ab44SLisandro Dalcin nz = header[3]; 10978491ab44SLisandro Dalcin if (nz != MATRIX_BINARY_FORMAT_DENSE && nz < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Unknown matrix format %D in file",nz); 1098aabbc4fbSShri Abhyankar } else { 10998491ab44SLisandro Dalcin ierr = MatGetSize(mat,&M,&N);CHKERRQ(ierr); 11008491ab44SLisandro Dalcin if (M < 0 || N < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Matrix binary file header was skipped, thus the user must specify the global sizes of input matrix"); 11018491ab44SLisandro Dalcin nz = MATRIX_BINARY_FORMAT_DENSE; 1102e6324fbbSBarry Smith } 1103aabbc4fbSShri Abhyankar 11048491ab44SLisandro Dalcin /* setup global sizes if not set */ 11058491ab44SLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 11068491ab44SLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 11078491ab44SLisandro Dalcin ierr = MatSetUp(mat);CHKERRQ(ierr); 11088491ab44SLisandro Dalcin /* check if global sizes are correct */ 11098491ab44SLisandro Dalcin ierr = MatGetSize(mat,&rows,&cols);CHKERRQ(ierr); 11108491ab44SLisandro Dalcin if (M != rows || N != cols) SETERRQ4(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%d, %d) than the input matrix (%d, %d)",M,N,rows,cols); 1111aabbc4fbSShri Abhyankar 11128491ab44SLisandro Dalcin ierr = MatGetSize(mat,NULL,&N);CHKERRQ(ierr); 11138491ab44SLisandro Dalcin ierr = MatGetLocalSize(mat,&m,NULL);CHKERRQ(ierr); 11148491ab44SLisandro Dalcin ierr = MatDenseGetArray(mat,&v);CHKERRQ(ierr); 11158491ab44SLisandro Dalcin ierr = MatDenseGetLDA(mat,&lda);CHKERRQ(ierr); 11168491ab44SLisandro Dalcin if (nz == MATRIX_BINARY_FORMAT_DENSE) { /* matrix in file is dense format */ 11178491ab44SLisandro Dalcin PetscInt nnz = m*N; 11188491ab44SLisandro Dalcin /* read in matrix values */ 11198491ab44SLisandro Dalcin ierr = PetscMalloc1(nnz,&vwork);CHKERRQ(ierr); 11208491ab44SLisandro Dalcin ierr = PetscViewerBinaryReadAll(viewer,vwork,nnz,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_SCALAR);CHKERRQ(ierr); 11218491ab44SLisandro Dalcin /* store values in column major order */ 11228491ab44SLisandro Dalcin for (j=0; j<N; j++) 11238491ab44SLisandro Dalcin for (i=0; i<m; i++) 11248491ab44SLisandro Dalcin v[i+lda*j] = vwork[i*N+j]; 11258491ab44SLisandro Dalcin ierr = PetscFree(vwork);CHKERRQ(ierr); 11268491ab44SLisandro Dalcin } else { /* matrix in file is sparse format */ 11278491ab44SLisandro Dalcin PetscInt nnz = 0, *rlens, *icols; 11288491ab44SLisandro Dalcin /* read in row lengths */ 11298491ab44SLisandro Dalcin ierr = PetscMalloc1(m,&rlens);CHKERRQ(ierr); 11308491ab44SLisandro Dalcin ierr = PetscViewerBinaryReadAll(viewer,rlens,m,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_INT);CHKERRQ(ierr); 11318491ab44SLisandro Dalcin for (i=0; i<m; i++) nnz += rlens[i]; 11328491ab44SLisandro Dalcin /* read in column indices and values */ 11338491ab44SLisandro Dalcin ierr = PetscMalloc2(nnz,&icols,nnz,&vwork);CHKERRQ(ierr); 11348491ab44SLisandro Dalcin ierr = PetscViewerBinaryReadAll(viewer,icols,nnz,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_INT);CHKERRQ(ierr); 11358491ab44SLisandro Dalcin ierr = PetscViewerBinaryReadAll(viewer,vwork,nnz,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_SCALAR);CHKERRQ(ierr); 11368491ab44SLisandro Dalcin /* store values in column major order */ 11378491ab44SLisandro Dalcin for (k=0, i=0; i<m; i++) 11388491ab44SLisandro Dalcin for (j=0; j<rlens[i]; j++, k++) 11398491ab44SLisandro Dalcin v[i+lda*icols[k]] = vwork[k]; 11408491ab44SLisandro Dalcin ierr = PetscFree(rlens);CHKERRQ(ierr); 11418491ab44SLisandro Dalcin ierr = PetscFree2(icols,vwork);CHKERRQ(ierr); 1142aabbc4fbSShri Abhyankar } 11438491ab44SLisandro Dalcin ierr = MatDenseRestoreArray(mat,&v);CHKERRQ(ierr); 11448491ab44SLisandro Dalcin ierr = MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 11458491ab44SLisandro Dalcin ierr = MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1146aabbc4fbSShri Abhyankar PetscFunctionReturn(0); 1147aabbc4fbSShri Abhyankar } 1148aabbc4fbSShri Abhyankar 1149eb91f321SVaclav Hapla PetscErrorCode MatLoad_SeqDense(Mat newMat, PetscViewer viewer) 1150eb91f321SVaclav Hapla { 1151eb91f321SVaclav Hapla PetscBool isbinary, ishdf5; 1152eb91f321SVaclav Hapla PetscErrorCode ierr; 1153eb91f321SVaclav Hapla 1154eb91f321SVaclav Hapla PetscFunctionBegin; 1155eb91f321SVaclav Hapla PetscValidHeaderSpecific(newMat,MAT_CLASSID,1); 1156eb91f321SVaclav Hapla PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2); 1157eb91f321SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 1158eb91f321SVaclav Hapla ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 1159eb91f321SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 1160eb91f321SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5, &ishdf5);CHKERRQ(ierr); 1161eb91f321SVaclav Hapla if (isbinary) { 11628491ab44SLisandro Dalcin ierr = MatLoad_Dense_Binary(newMat,viewer);CHKERRQ(ierr); 1163eb91f321SVaclav Hapla } else if (ishdf5) { 1164eb91f321SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 1165eb91f321SVaclav Hapla ierr = MatLoad_Dense_HDF5(newMat,viewer);CHKERRQ(ierr); 1166eb91f321SVaclav Hapla #else 1167eb91f321SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 1168eb91f321SVaclav Hapla #endif 1169eb91f321SVaclav Hapla } else { 1170eb91f321SVaclav Hapla SETERRQ2(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name); 1171eb91f321SVaclav Hapla } 1172eb91f321SVaclav Hapla PetscFunctionReturn(0); 1173eb91f321SVaclav Hapla } 1174eb91f321SVaclav Hapla 11756849ba73SBarry Smith static PetscErrorCode MatView_SeqDense_ASCII(Mat A,PetscViewer viewer) 1176289bc588SBarry Smith { 1177932b0c3eSLois Curfman McInnes Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1178dfbe8321SBarry Smith PetscErrorCode ierr; 117913f74950SBarry Smith PetscInt i,j; 11802dcb1b2aSMatthew Knepley const char *name; 1181ca15aa20SStefano Zampini PetscScalar *v,*av; 1182f3ef73ceSBarry Smith PetscViewerFormat format; 11835f481a85SSatish Balay #if defined(PETSC_USE_COMPLEX) 1184ace3abfcSBarry Smith PetscBool allreal = PETSC_TRUE; 11855f481a85SSatish Balay #endif 1186932b0c3eSLois Curfman McInnes 11873a40ed3dSBarry Smith PetscFunctionBegin; 1188ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,(const PetscScalar**)&av);CHKERRQ(ierr); 1189b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 1190456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 11913a40ed3dSBarry Smith PetscFunctionReturn(0); /* do nothing for now */ 1192fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 1193d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 1194d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1195ca15aa20SStefano Zampini v = av + i; 119677431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 1197d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1198aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 1199329f5518SBarry Smith if (PetscRealPart(*v) != 0.0 && PetscImaginaryPart(*v) != 0.0) { 120057622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i) ",j,(double)PetscRealPart(*v),(double)PetscImaginaryPart(*v));CHKERRQ(ierr); 1201329f5518SBarry Smith } else if (PetscRealPart(*v)) { 120257622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",j,(double)PetscRealPart(*v));CHKERRQ(ierr); 12036831982aSBarry Smith } 120480cd9d93SLois Curfman McInnes #else 12056831982aSBarry Smith if (*v) { 120657622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",j,(double)*v);CHKERRQ(ierr); 12076831982aSBarry Smith } 120880cd9d93SLois Curfman McInnes #endif 12091b807ce4Svictorle v += a->lda; 121080cd9d93SLois Curfman McInnes } 1211b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 121280cd9d93SLois Curfman McInnes } 1213d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 12143a40ed3dSBarry Smith } else { 1215d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 1216aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 121747989497SBarry Smith /* determine if matrix has all real values */ 1218ca15aa20SStefano Zampini v = av; 1219d0f46423SBarry Smith for (i=0; i<A->rmap->n*A->cmap->n; i++) { 1220ffac6cdbSBarry Smith if (PetscImaginaryPart(v[i])) { allreal = PETSC_FALSE; break;} 122147989497SBarry Smith } 122247989497SBarry Smith #endif 1223fb9695e5SSatish Balay if (format == PETSC_VIEWER_ASCII_MATLAB) { 12243a7fca6bSBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 1225d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",A->rmap->n,A->cmap->n);CHKERRQ(ierr); 1226d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%s = zeros(%D,%D);\n",name,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 1227fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"%s = [\n",name);CHKERRQ(ierr); 1228ffac6cdbSBarry Smith } 1229ffac6cdbSBarry Smith 1230d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1231ca15aa20SStefano Zampini v = av + i; 1232d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1233aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 123447989497SBarry Smith if (allreal) { 1235c61cd2faSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%18.16e ",(double)PetscRealPart(*v));CHKERRQ(ierr); 123647989497SBarry Smith } else { 1237c61cd2faSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%18.16e + %18.16ei ",(double)PetscRealPart(*v),(double)PetscImaginaryPart(*v));CHKERRQ(ierr); 123847989497SBarry Smith } 1239289bc588SBarry Smith #else 1240c61cd2faSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%18.16e ",(double)*v);CHKERRQ(ierr); 1241289bc588SBarry Smith #endif 12421b807ce4Svictorle v += a->lda; 1243289bc588SBarry Smith } 1244b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 1245289bc588SBarry Smith } 1246fb9695e5SSatish Balay if (format == PETSC_VIEWER_ASCII_MATLAB) { 1247b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"];\n");CHKERRQ(ierr); 1248ffac6cdbSBarry Smith } 1249d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 1250da3a660dSBarry Smith } 1251ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&av);CHKERRQ(ierr); 1252b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 12533a40ed3dSBarry Smith PetscFunctionReturn(0); 1254289bc588SBarry Smith } 1255289bc588SBarry Smith 12569804daf3SBarry Smith #include <petscdraw.h> 1257e0877f53SBarry Smith static PetscErrorCode MatView_SeqDense_Draw_Zoom(PetscDraw draw,void *Aa) 1258f1af5d2fSBarry Smith { 1259f1af5d2fSBarry Smith Mat A = (Mat) Aa; 12606849ba73SBarry Smith PetscErrorCode ierr; 1261383922c3SLisandro Dalcin PetscInt m = A->rmap->n,n = A->cmap->n,i,j; 1262383922c3SLisandro Dalcin int color = PETSC_DRAW_WHITE; 1263ca15aa20SStefano Zampini const PetscScalar *v; 1264b0a32e0cSBarry Smith PetscViewer viewer; 1265b05fc000SLisandro Dalcin PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 1266f3ef73ceSBarry Smith PetscViewerFormat format; 1267f1af5d2fSBarry Smith 1268f1af5d2fSBarry Smith PetscFunctionBegin; 1269f1af5d2fSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 1270b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 1271b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 1272f1af5d2fSBarry Smith 1273f1af5d2fSBarry Smith /* Loop over matrix elements drawing boxes */ 1274ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 1275fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 1276383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 1277f1af5d2fSBarry Smith /* Blue for negative and Red for positive */ 1278f1af5d2fSBarry Smith for (j = 0; j < n; j++) { 1279383922c3SLisandro Dalcin x_l = j; x_r = x_l + 1.0; 1280f1af5d2fSBarry Smith for (i = 0; i < m; i++) { 1281f1af5d2fSBarry Smith y_l = m - i - 1.0; 1282f1af5d2fSBarry Smith y_r = y_l + 1.0; 1283ca15aa20SStefano Zampini if (PetscRealPart(v[j*m+i]) > 0.) color = PETSC_DRAW_RED; 1284ca15aa20SStefano Zampini else if (PetscRealPart(v[j*m+i]) < 0.) color = PETSC_DRAW_BLUE; 1285ca15aa20SStefano Zampini else continue; 1286b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 1287f1af5d2fSBarry Smith } 1288f1af5d2fSBarry Smith } 1289383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 1290f1af5d2fSBarry Smith } else { 1291f1af5d2fSBarry Smith /* use contour shading to indicate magnitude of values */ 1292f1af5d2fSBarry Smith /* first determine max of all nonzero values */ 1293b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1294b05fc000SLisandro Dalcin PetscDraw popup; 1295b05fc000SLisandro Dalcin 1296f1af5d2fSBarry Smith for (i=0; i < m*n; i++) { 1297f1af5d2fSBarry Smith if (PetscAbsScalar(v[i]) > maxv) maxv = PetscAbsScalar(v[i]); 1298f1af5d2fSBarry Smith } 1299383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 1300b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 130145f3bb6eSLisandro Dalcin ierr = PetscDrawScalePopup(popup,minv,maxv);CHKERRQ(ierr); 1302383922c3SLisandro Dalcin 1303383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 1304f1af5d2fSBarry Smith for (j=0; j<n; j++) { 1305f1af5d2fSBarry Smith x_l = j; 1306f1af5d2fSBarry Smith x_r = x_l + 1.0; 1307f1af5d2fSBarry Smith for (i=0; i<m; i++) { 1308f1af5d2fSBarry Smith y_l = m - i - 1.0; 1309f1af5d2fSBarry Smith y_r = y_l + 1.0; 1310b05fc000SLisandro Dalcin color = PetscDrawRealToColor(PetscAbsScalar(v[j*m+i]),minv,maxv); 1311b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 1312f1af5d2fSBarry Smith } 1313f1af5d2fSBarry Smith } 1314383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 1315f1af5d2fSBarry Smith } 1316ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 1317f1af5d2fSBarry Smith PetscFunctionReturn(0); 1318f1af5d2fSBarry Smith } 1319f1af5d2fSBarry Smith 1320e0877f53SBarry Smith static PetscErrorCode MatView_SeqDense_Draw(Mat A,PetscViewer viewer) 1321f1af5d2fSBarry Smith { 1322b0a32e0cSBarry Smith PetscDraw draw; 1323ace3abfcSBarry Smith PetscBool isnull; 1324329f5518SBarry Smith PetscReal xr,yr,xl,yl,h,w; 1325dfbe8321SBarry Smith PetscErrorCode ierr; 1326f1af5d2fSBarry Smith 1327f1af5d2fSBarry Smith PetscFunctionBegin; 1328b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 1329b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 1330abc0a331SBarry Smith if (isnull) PetscFunctionReturn(0); 1331f1af5d2fSBarry Smith 1332d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1333f1af5d2fSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 1334b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 1335832b7cebSLisandro Dalcin ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 1336b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqDense_Draw_Zoom,A);CHKERRQ(ierr); 13370298fd71SBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL);CHKERRQ(ierr); 1338832b7cebSLisandro Dalcin ierr = PetscDrawSave(draw);CHKERRQ(ierr); 1339f1af5d2fSBarry Smith PetscFunctionReturn(0); 1340f1af5d2fSBarry Smith } 1341f1af5d2fSBarry Smith 1342dfbe8321SBarry Smith PetscErrorCode MatView_SeqDense(Mat A,PetscViewer viewer) 1343932b0c3eSLois Curfman McInnes { 1344dfbe8321SBarry Smith PetscErrorCode ierr; 1345ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1346932b0c3eSLois Curfman McInnes 13473a40ed3dSBarry Smith PetscFunctionBegin; 1348251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 1349251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 1350251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 13510f5bd95cSBarry Smith 1352c45a1595SBarry Smith if (iascii) { 1353c45a1595SBarry Smith ierr = MatView_SeqDense_ASCII(A,viewer);CHKERRQ(ierr); 13540f5bd95cSBarry Smith } else if (isbinary) { 1355637a0070SStefano Zampini ierr = MatView_Dense_Binary(A,viewer);CHKERRQ(ierr); 1356f1af5d2fSBarry Smith } else if (isdraw) { 1357f1af5d2fSBarry Smith ierr = MatView_SeqDense_Draw(A,viewer);CHKERRQ(ierr); 1358932b0c3eSLois Curfman McInnes } 13593a40ed3dSBarry Smith PetscFunctionReturn(0); 1360932b0c3eSLois Curfman McInnes } 1361289bc588SBarry Smith 1362637a0070SStefano Zampini static PetscErrorCode MatDensePlaceArray_SeqDense(Mat A,const PetscScalar *array) 1363d3042a70SBarry Smith { 1364d3042a70SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1365d3042a70SBarry Smith 1366d3042a70SBarry Smith PetscFunctionBegin; 13676947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 1368d5ea218eSStefano Zampini if (a->unplacedarray) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreArray first"); 1369d3042a70SBarry Smith a->unplacedarray = a->v; 1370d3042a70SBarry Smith a->unplaced_user_alloc = a->user_alloc; 1371d3042a70SBarry Smith a->v = (PetscScalar*) array; 1372637a0070SStefano Zampini a->user_alloc = PETSC_TRUE; 1373ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1374c70f7ee4SJunchao Zhang A->offloadmask = PETSC_OFFLOAD_CPU; 1375ca15aa20SStefano Zampini #endif 1376d3042a70SBarry Smith PetscFunctionReturn(0); 1377d3042a70SBarry Smith } 1378d3042a70SBarry Smith 1379d3042a70SBarry Smith static PetscErrorCode MatDenseResetArray_SeqDense(Mat A) 1380d3042a70SBarry Smith { 1381d3042a70SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1382d3042a70SBarry Smith 1383d3042a70SBarry Smith PetscFunctionBegin; 13846947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 1385d3042a70SBarry Smith a->v = a->unplacedarray; 1386d3042a70SBarry Smith a->user_alloc = a->unplaced_user_alloc; 1387d3042a70SBarry Smith a->unplacedarray = NULL; 1388ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1389c70f7ee4SJunchao Zhang A->offloadmask = PETSC_OFFLOAD_CPU; 1390ca15aa20SStefano Zampini #endif 1391d3042a70SBarry Smith PetscFunctionReturn(0); 1392d3042a70SBarry Smith } 1393d3042a70SBarry Smith 1394d5ea218eSStefano Zampini static PetscErrorCode MatDenseReplaceArray_SeqDense(Mat A,const PetscScalar *array) 1395d5ea218eSStefano Zampini { 1396d5ea218eSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1397d5ea218eSStefano Zampini PetscErrorCode ierr; 1398d5ea218eSStefano Zampini 1399d5ea218eSStefano Zampini PetscFunctionBegin; 1400d5ea218eSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 1401d5ea218eSStefano Zampini if (!a->user_alloc) { ierr = PetscFree(a->v);CHKERRQ(ierr); } 1402d5ea218eSStefano Zampini a->v = (PetscScalar*) array; 1403d5ea218eSStefano Zampini a->user_alloc = PETSC_FALSE; 1404d5ea218eSStefano Zampini #if defined(PETSC_HAVE_CUDA) 1405d5ea218eSStefano Zampini A->offloadmask = PETSC_OFFLOAD_CPU; 1406d5ea218eSStefano Zampini #endif 1407d5ea218eSStefano Zampini PetscFunctionReturn(0); 1408d5ea218eSStefano Zampini } 1409d5ea218eSStefano Zampini 1410ca15aa20SStefano Zampini PetscErrorCode MatDestroy_SeqDense(Mat mat) 1411289bc588SBarry Smith { 1412ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)mat->data; 1413dfbe8321SBarry Smith PetscErrorCode ierr; 141490f02eecSBarry Smith 14153a40ed3dSBarry Smith PetscFunctionBegin; 1416aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1417d0f46423SBarry Smith PetscLogObjectState((PetscObject)mat,"Rows %D Cols %D",mat->rmap->n,mat->cmap->n); 1418a5a9c739SBarry Smith #endif 141905b42c5fSBarry Smith ierr = PetscFree(l->pivots);CHKERRQ(ierr); 1420a49dc2a2SStefano Zampini ierr = PetscFree(l->fwork);CHKERRQ(ierr); 1421abc3b08eSStefano Zampini ierr = MatDestroy(&l->ptapwork);CHKERRQ(ierr); 14226857c123SSatish Balay if (!l->user_alloc) {ierr = PetscFree(l->v);CHKERRQ(ierr);} 1423637a0070SStefano Zampini if (!l->unplaced_user_alloc) {ierr = PetscFree(l->unplacedarray);CHKERRQ(ierr);} 14246947451fSStefano Zampini ierr = VecDestroy(&l->cvec);CHKERRQ(ierr); 1425bf0cc555SLisandro Dalcin ierr = PetscFree(mat->data);CHKERRQ(ierr); 1426dbd8c25aSHong Zhang 1427dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)mat,0);CHKERRQ(ierr); 142849a6ff4bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetLDA_C",NULL);CHKERRQ(ierr); 1429*ad16ce7aSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseSetLDA_C",NULL);CHKERRQ(ierr); 1430bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetArray_C",NULL);CHKERRQ(ierr); 143152c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreArray_C",NULL);CHKERRQ(ierr); 1432d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDensePlaceArray_C",NULL);CHKERRQ(ierr); 1433d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseResetArray_C",NULL);CHKERRQ(ierr); 1434d5ea218eSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseReplaceArray_C",NULL);CHKERRQ(ierr); 143552c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetArrayRead_C",NULL);CHKERRQ(ierr); 143652c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreArrayRead_C",NULL);CHKERRQ(ierr); 14376947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetArrayWrite_C",NULL);CHKERRQ(ierr); 14386947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreArrayWrite_C",NULL);CHKERRQ(ierr); 14398baccfbdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatConvert_seqdense_seqaij_C",NULL);CHKERRQ(ierr); 14408baccfbdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 14418baccfbdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatConvert_seqdense_elemental_C",NULL);CHKERRQ(ierr); 14428baccfbdSHong Zhang #endif 14432bf066beSStefano Zampini #if defined(PETSC_HAVE_CUDA) 14442bf066beSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatConvert_seqdense_seqdensecuda_C",NULL);CHKERRQ(ierr); 14454222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqdensecuda_seqdensecuda_C",NULL);CHKERRQ(ierr); 14464222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqdensecuda_seqdense_C",NULL);CHKERRQ(ierr); 14474222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqaijcusparse_seqdense_C",NULL);CHKERRQ(ierr); 14482bf066beSStefano Zampini #endif 1449bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatSeqDenseSetPreallocation_C",NULL);CHKERRQ(ierr); 14504222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 14514222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqdense_seqdense_C",NULL);CHKERRQ(ierr); 1452bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 1453bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 14544222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqbaij_seqdense_C",NULL);CHKERRQ(ierr); 1455a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqbaij_seqdense_C",NULL);CHKERRQ(ierr); 1456a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqbaij_seqdense_C",NULL);CHKERRQ(ierr); 14574222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqsbaij_seqdense_C",NULL);CHKERRQ(ierr); 1458c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqsbaij_seqdense_C",NULL);CHKERRQ(ierr); 1459c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqsbaij_seqdense_C",NULL);CHKERRQ(ierr); 146052c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 146152c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 146252c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 146352c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 146452c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 146552c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 146652c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_nest_seqdense_C",NULL);CHKERRQ(ierr); 146752c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_nest_seqdense_C",NULL);CHKERRQ(ierr); 146852c5f739Sprj- 14693bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultSymbolic_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 14703bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultNumeric_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 147152c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultSymbolic_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 147252c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultNumeric_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 147352c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultSymbolic_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 147452c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultNumeric_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 147552c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultSymbolic_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 147652c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultNumeric_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 147786aefd0dSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumn_C",NULL);CHKERRQ(ierr); 147886aefd0dSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumn_C",NULL);CHKERRQ(ierr); 14796947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumnVec_C",NULL);CHKERRQ(ierr); 14806947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumnVec_C",NULL);CHKERRQ(ierr); 14816947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumnVecRead_C",NULL);CHKERRQ(ierr); 14826947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumnVecRead_C",NULL);CHKERRQ(ierr); 14836947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumnVecWrite_C",NULL);CHKERRQ(ierr); 14846947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumnVecWrite_C",NULL);CHKERRQ(ierr); 14853a40ed3dSBarry Smith PetscFunctionReturn(0); 1486289bc588SBarry Smith } 1487289bc588SBarry Smith 1488e0877f53SBarry Smith static PetscErrorCode MatTranspose_SeqDense(Mat A,MatReuse reuse,Mat *matout) 1489289bc588SBarry Smith { 1490c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 14916849ba73SBarry Smith PetscErrorCode ierr; 149213f74950SBarry Smith PetscInt k,j,m,n,M; 149387828ca2SBarry Smith PetscScalar *v,tmp; 149448b35521SBarry Smith 14953a40ed3dSBarry Smith PetscFunctionBegin; 1496ca15aa20SStefano Zampini m = A->rmap->n; M = mat->lda; n = A->cmap->n; 14972847e3fdSStefano Zampini if (reuse == MAT_INPLACE_MATRIX && m == n) { /* in place transpose */ 1498ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 1499d3e5ee88SLois Curfman McInnes for (j=0; j<m; j++) { 1500289bc588SBarry Smith for (k=0; k<j; k++) { 15011b807ce4Svictorle tmp = v[j + k*M]; 15021b807ce4Svictorle v[j + k*M] = v[k + j*M]; 15031b807ce4Svictorle v[k + j*M] = tmp; 1504289bc588SBarry Smith } 1505289bc588SBarry Smith } 1506ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 15073a40ed3dSBarry Smith } else { /* out-of-place transpose */ 1508d3e5ee88SLois Curfman McInnes Mat tmat; 1509ec8511deSBarry Smith Mat_SeqDense *tmatd; 151087828ca2SBarry Smith PetscScalar *v2; 1511af36a384SStefano Zampini PetscInt M2; 1512ea709b57SSatish Balay 15132847e3fdSStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 1514ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&tmat);CHKERRQ(ierr); 1515d0f46423SBarry Smith ierr = MatSetSizes(tmat,A->cmap->n,A->rmap->n,A->cmap->n,A->rmap->n);CHKERRQ(ierr); 15167adad957SLisandro Dalcin ierr = MatSetType(tmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 15170298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(tmat,NULL);CHKERRQ(ierr); 1518ca15aa20SStefano Zampini } else tmat = *matout; 1519ca15aa20SStefano Zampini 1520ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,(const PetscScalar**)&v);CHKERRQ(ierr); 1521ca15aa20SStefano Zampini ierr = MatDenseGetArray(tmat,&v2);CHKERRQ(ierr); 1522ec8511deSBarry Smith tmatd = (Mat_SeqDense*)tmat->data; 1523ca15aa20SStefano Zampini M2 = tmatd->lda; 1524d3e5ee88SLois Curfman McInnes for (j=0; j<n; j++) { 1525af36a384SStefano Zampini for (k=0; k<m; k++) v2[j + k*M2] = v[k + j*M]; 1526d3e5ee88SLois Curfman McInnes } 1527ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(tmat,&v2);CHKERRQ(ierr); 1528ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&v);CHKERRQ(ierr); 15296d4a8577SBarry Smith ierr = MatAssemblyBegin(tmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15306d4a8577SBarry Smith ierr = MatAssemblyEnd(tmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15312847e3fdSStefano Zampini if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) *matout = tmat; 15322847e3fdSStefano Zampini else { 15332847e3fdSStefano Zampini ierr = MatHeaderMerge(A,&tmat);CHKERRQ(ierr); 15342847e3fdSStefano Zampini } 153548b35521SBarry Smith } 15363a40ed3dSBarry Smith PetscFunctionReturn(0); 1537289bc588SBarry Smith } 1538289bc588SBarry Smith 1539e0877f53SBarry Smith static PetscErrorCode MatEqual_SeqDense(Mat A1,Mat A2,PetscBool *flg) 1540289bc588SBarry Smith { 1541c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat1 = (Mat_SeqDense*)A1->data; 1542c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat2 = (Mat_SeqDense*)A2->data; 1543ca15aa20SStefano Zampini PetscInt i; 1544ca15aa20SStefano Zampini const PetscScalar *v1,*v2; 1545ca15aa20SStefano Zampini PetscErrorCode ierr; 15469ea5d5aeSSatish Balay 15473a40ed3dSBarry Smith PetscFunctionBegin; 1548d0f46423SBarry Smith if (A1->rmap->n != A2->rmap->n) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 1549d0f46423SBarry Smith if (A1->cmap->n != A2->cmap->n) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 1550ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A1,&v1);CHKERRQ(ierr); 1551ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A2,&v2);CHKERRQ(ierr); 1552ca15aa20SStefano Zampini for (i=0; i<A1->cmap->n; i++) { 1553ca15aa20SStefano Zampini ierr = PetscArraycmp(v1,v2,A1->rmap->n,flg);CHKERRQ(ierr); 1554ca15aa20SStefano Zampini if (*flg == PETSC_FALSE) PetscFunctionReturn(0); 1555ca15aa20SStefano Zampini v1 += mat1->lda; 1556ca15aa20SStefano Zampini v2 += mat2->lda; 15571b807ce4Svictorle } 1558ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A1,&v1);CHKERRQ(ierr); 1559ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A2,&v2);CHKERRQ(ierr); 156077c4ece6SBarry Smith *flg = PETSC_TRUE; 15613a40ed3dSBarry Smith PetscFunctionReturn(0); 1562289bc588SBarry Smith } 1563289bc588SBarry Smith 1564e0877f53SBarry Smith static PetscErrorCode MatGetDiagonal_SeqDense(Mat A,Vec v) 1565289bc588SBarry Smith { 1566c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 156713f74950SBarry Smith PetscInt i,n,len; 1568ca15aa20SStefano Zampini PetscScalar *x; 1569ca15aa20SStefano Zampini const PetscScalar *vv; 1570ca15aa20SStefano Zampini PetscErrorCode ierr; 157144cd7ae7SLois Curfman McInnes 15723a40ed3dSBarry Smith PetscFunctionBegin; 15737a97a34bSBarry Smith ierr = VecGetSize(v,&n);CHKERRQ(ierr); 15741ebc52fbSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1575d0f46423SBarry Smith len = PetscMin(A->rmap->n,A->cmap->n); 1576ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&vv);CHKERRQ(ierr); 1577e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming mat and vec"); 157844cd7ae7SLois Curfman McInnes for (i=0; i<len; i++) { 1579ca15aa20SStefano Zampini x[i] = vv[i*mat->lda + i]; 1580289bc588SBarry Smith } 1581ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&vv);CHKERRQ(ierr); 15821ebc52fbSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 15833a40ed3dSBarry Smith PetscFunctionReturn(0); 1584289bc588SBarry Smith } 1585289bc588SBarry Smith 1586e0877f53SBarry Smith static PetscErrorCode MatDiagonalScale_SeqDense(Mat A,Vec ll,Vec rr) 1587289bc588SBarry Smith { 1588c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1589f1ceaac6SMatthew G. Knepley const PetscScalar *l,*r; 1590ca15aa20SStefano Zampini PetscScalar x,*v,*vv; 1591dfbe8321SBarry Smith PetscErrorCode ierr; 1592d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n; 159355659b69SBarry Smith 15943a40ed3dSBarry Smith PetscFunctionBegin; 1595ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&vv);CHKERRQ(ierr); 159628988994SBarry Smith if (ll) { 15977a97a34bSBarry Smith ierr = VecGetSize(ll,&m);CHKERRQ(ierr); 1598f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(ll,&l);CHKERRQ(ierr); 1599e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vec wrong size"); 1600da3a660dSBarry Smith for (i=0; i<m; i++) { 1601da3a660dSBarry Smith x = l[i]; 1602ca15aa20SStefano Zampini v = vv + i; 1603b43bac26SStefano Zampini for (j=0; j<n; j++) { (*v) *= x; v+= mat->lda;} 1604da3a660dSBarry Smith } 1605f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(ll,&l);CHKERRQ(ierr); 1606eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*n*m);CHKERRQ(ierr); 1607da3a660dSBarry Smith } 160828988994SBarry Smith if (rr) { 16097a97a34bSBarry Smith ierr = VecGetSize(rr,&n);CHKERRQ(ierr); 1610f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(rr,&r);CHKERRQ(ierr); 1611e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vec wrong size"); 1612da3a660dSBarry Smith for (i=0; i<n; i++) { 1613da3a660dSBarry Smith x = r[i]; 1614ca15aa20SStefano Zampini v = vv + i*mat->lda; 16152205254eSKarl Rupp for (j=0; j<m; j++) (*v++) *= x; 1616da3a660dSBarry Smith } 1617f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(rr,&r);CHKERRQ(ierr); 1618eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*n*m);CHKERRQ(ierr); 1619da3a660dSBarry Smith } 1620ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&vv);CHKERRQ(ierr); 16213a40ed3dSBarry Smith PetscFunctionReturn(0); 1622289bc588SBarry Smith } 1623289bc588SBarry Smith 1624ca15aa20SStefano Zampini PetscErrorCode MatNorm_SeqDense(Mat A,NormType type,PetscReal *nrm) 1625289bc588SBarry Smith { 1626c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1627ca15aa20SStefano Zampini PetscScalar *v,*vv; 1628329f5518SBarry Smith PetscReal sum = 0.0; 1629d0f46423SBarry Smith PetscInt lda =mat->lda,m=A->rmap->n,i,j; 1630efee365bSSatish Balay PetscErrorCode ierr; 163155659b69SBarry Smith 16323a40ed3dSBarry Smith PetscFunctionBegin; 1633ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,(const PetscScalar**)&vv);CHKERRQ(ierr); 1634ca15aa20SStefano Zampini v = vv; 1635289bc588SBarry Smith if (type == NORM_FROBENIUS) { 1636a5ce6ee0Svictorle if (lda>m) { 1637d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1638ca15aa20SStefano Zampini v = vv+j*lda; 1639a5ce6ee0Svictorle for (i=0; i<m; i++) { 1640a5ce6ee0Svictorle sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 1641a5ce6ee0Svictorle } 1642a5ce6ee0Svictorle } 1643a5ce6ee0Svictorle } else { 1644570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 1645570b7f6dSBarry Smith PetscBLASInt one = 1,cnt = A->cmap->n*A->rmap->n; 1646570b7f6dSBarry Smith *nrm = BLASnrm2_(&cnt,v,&one); 1647570b7f6dSBarry Smith } 1648570b7f6dSBarry Smith #else 1649d0f46423SBarry Smith for (i=0; i<A->cmap->n*A->rmap->n; i++) { 1650329f5518SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 1651289bc588SBarry Smith } 1652a5ce6ee0Svictorle } 16538f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 1654570b7f6dSBarry Smith #endif 1655dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 16563a40ed3dSBarry Smith } else if (type == NORM_1) { 1657064f8208SBarry Smith *nrm = 0.0; 1658d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1659ca15aa20SStefano Zampini v = vv + j*mat->lda; 1660289bc588SBarry Smith sum = 0.0; 1661d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 166233a8263dSBarry Smith sum += PetscAbsScalar(*v); v++; 1663289bc588SBarry Smith } 1664064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 1665289bc588SBarry Smith } 1666eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 16673a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 1668064f8208SBarry Smith *nrm = 0.0; 1669d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 1670ca15aa20SStefano Zampini v = vv + j; 1671289bc588SBarry Smith sum = 0.0; 1672d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) { 16731b807ce4Svictorle sum += PetscAbsScalar(*v); v += mat->lda; 1674289bc588SBarry Smith } 1675064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 1676289bc588SBarry Smith } 1677eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 1678e7e72b3dSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No two norm"); 1679ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&vv);CHKERRQ(ierr); 16803a40ed3dSBarry Smith PetscFunctionReturn(0); 1681289bc588SBarry Smith } 1682289bc588SBarry Smith 1683e0877f53SBarry Smith static PetscErrorCode MatSetOption_SeqDense(Mat A,MatOption op,PetscBool flg) 1684289bc588SBarry Smith { 1685c0bbcb79SLois Curfman McInnes Mat_SeqDense *aij = (Mat_SeqDense*)A->data; 168663ba0a88SBarry Smith PetscErrorCode ierr; 168767e560aaSBarry Smith 16883a40ed3dSBarry Smith PetscFunctionBegin; 1689b5a2b587SKris Buschelman switch (op) { 1690b5a2b587SKris Buschelman case MAT_ROW_ORIENTED: 16914e0d8c25SBarry Smith aij->roworiented = flg; 1692b5a2b587SKris Buschelman break; 1693512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1694b5a2b587SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 16953971808eSMatthew Knepley case MAT_NEW_NONZERO_ALLOCATION_ERR: 16964e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 169713fa8e87SLisandro Dalcin case MAT_KEEP_NONZERO_PATTERN: 1698b5a2b587SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1699b5a2b587SKris Buschelman case MAT_USE_HASH_TABLE: 17000f8fb01aSBarry Smith case MAT_IGNORE_ZERO_ENTRIES: 17015021d80fSJed Brown case MAT_IGNORE_LOWER_TRIANGULAR: 1702071fcb05SBarry Smith case MAT_SORTED_FULL: 17035021d80fSJed Brown ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 17045021d80fSJed Brown break; 17055021d80fSJed Brown case MAT_SPD: 170677e54ba9SKris Buschelman case MAT_SYMMETRIC: 170777e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 17089a4540c5SBarry Smith case MAT_HERMITIAN: 17099a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 17105021d80fSJed Brown /* These options are handled directly by MatSetOption() */ 171177e54ba9SKris Buschelman break; 1712b5a2b587SKris Buschelman default: 1713e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %s",MatOptions[op]); 17143a40ed3dSBarry Smith } 17153a40ed3dSBarry Smith PetscFunctionReturn(0); 1716289bc588SBarry Smith } 1717289bc588SBarry Smith 1718e0877f53SBarry Smith static PetscErrorCode MatZeroEntries_SeqDense(Mat A) 17196f0a148fSBarry Smith { 1720ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)A->data; 17216849ba73SBarry Smith PetscErrorCode ierr; 1722d0f46423SBarry Smith PetscInt lda=l->lda,m=A->rmap->n,j; 1723ca15aa20SStefano Zampini PetscScalar *v; 17243a40ed3dSBarry Smith 17253a40ed3dSBarry Smith PetscFunctionBegin; 1726ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 1727a5ce6ee0Svictorle if (lda>m) { 1728d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1729ca15aa20SStefano Zampini ierr = PetscArrayzero(v+j*lda,m);CHKERRQ(ierr); 1730a5ce6ee0Svictorle } 1731a5ce6ee0Svictorle } else { 1732ca15aa20SStefano Zampini ierr = PetscArrayzero(v,A->rmap->n*A->cmap->n);CHKERRQ(ierr); 1733a5ce6ee0Svictorle } 1734ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 17353a40ed3dSBarry Smith PetscFunctionReturn(0); 17366f0a148fSBarry Smith } 17376f0a148fSBarry Smith 1738e0877f53SBarry Smith static PetscErrorCode MatZeroRows_SeqDense(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 17396f0a148fSBarry Smith { 174097b48c8fSBarry Smith PetscErrorCode ierr; 1741ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)A->data; 1742b9679d65SBarry Smith PetscInt m = l->lda, n = A->cmap->n, i,j; 1743ca15aa20SStefano Zampini PetscScalar *slot,*bb,*v; 174497b48c8fSBarry Smith const PetscScalar *xx; 174555659b69SBarry Smith 17463a40ed3dSBarry Smith PetscFunctionBegin; 174776bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 1748b9679d65SBarry Smith for (i=0; i<N; i++) { 1749b9679d65SBarry Smith if (rows[i] < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row requested to be zeroed"); 1750b9679d65SBarry Smith if (rows[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested to be zeroed greater than or equal number of rows %D",rows[i],A->rmap->n); 1751b9679d65SBarry Smith } 175276bd3646SJed Brown } 1753ca15aa20SStefano Zampini if (!N) PetscFunctionReturn(0); 1754b9679d65SBarry Smith 175597b48c8fSBarry Smith /* fix right hand side if needed */ 175697b48c8fSBarry Smith if (x && b) { 175797b48c8fSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 175897b48c8fSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 17592205254eSKarl Rupp for (i=0; i<N; i++) bb[rows[i]] = diag*xx[rows[i]]; 176097b48c8fSBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 176197b48c8fSBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 176297b48c8fSBarry Smith } 176397b48c8fSBarry Smith 1764ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 17656f0a148fSBarry Smith for (i=0; i<N; i++) { 1766ca15aa20SStefano Zampini slot = v + rows[i]; 1767b9679d65SBarry Smith for (j=0; j<n; j++) { *slot = 0.0; slot += m;} 17686f0a148fSBarry Smith } 1769f4df32b1SMatthew Knepley if (diag != 0.0) { 1770b9679d65SBarry Smith if (A->rmap->n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only coded for square matrices"); 17716f0a148fSBarry Smith for (i=0; i<N; i++) { 1772ca15aa20SStefano Zampini slot = v + (m+1)*rows[i]; 1773f4df32b1SMatthew Knepley *slot = diag; 17746f0a148fSBarry Smith } 17756f0a148fSBarry Smith } 1776ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 17773a40ed3dSBarry Smith PetscFunctionReturn(0); 17786f0a148fSBarry Smith } 1779557bce09SLois Curfman McInnes 178049a6ff4bSBarry Smith static PetscErrorCode MatDenseGetLDA_SeqDense(Mat A,PetscInt *lda) 178149a6ff4bSBarry Smith { 178249a6ff4bSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 178349a6ff4bSBarry Smith 178449a6ff4bSBarry Smith PetscFunctionBegin; 178549a6ff4bSBarry Smith *lda = mat->lda; 178649a6ff4bSBarry Smith PetscFunctionReturn(0); 178749a6ff4bSBarry Smith } 178849a6ff4bSBarry Smith 1789637a0070SStefano Zampini PetscErrorCode MatDenseGetArray_SeqDense(Mat A,PetscScalar **array) 179064e87e97SBarry Smith { 1791c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 17923a40ed3dSBarry Smith 17933a40ed3dSBarry Smith PetscFunctionBegin; 179464e87e97SBarry Smith *array = mat->v; 17953a40ed3dSBarry Smith PetscFunctionReturn(0); 179664e87e97SBarry Smith } 17970754003eSLois Curfman McInnes 1798637a0070SStefano Zampini PetscErrorCode MatDenseRestoreArray_SeqDense(Mat A,PetscScalar **array) 1799ff14e315SSatish Balay { 18003a40ed3dSBarry Smith PetscFunctionBegin; 1801637a0070SStefano Zampini *array = NULL; 18023a40ed3dSBarry Smith PetscFunctionReturn(0); 1803ff14e315SSatish Balay } 18040754003eSLois Curfman McInnes 1805dec5eb66SMatthew G Knepley /*@C 180649a6ff4bSBarry Smith MatDenseGetLDA - gets the leading dimension of the array returned from MatDenseGetArray() 180749a6ff4bSBarry Smith 1808*ad16ce7aSStefano Zampini Not collective 180949a6ff4bSBarry Smith 181049a6ff4bSBarry Smith Input Parameter: 181149a6ff4bSBarry Smith . mat - a MATSEQDENSE or MATMPIDENSE matrix 181249a6ff4bSBarry Smith 181349a6ff4bSBarry Smith Output Parameter: 181449a6ff4bSBarry Smith . lda - the leading dimension 181549a6ff4bSBarry Smith 181649a6ff4bSBarry Smith Level: intermediate 181749a6ff4bSBarry Smith 1818*ad16ce7aSStefano Zampini .seealso: MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead(), MatDenseSetLDA() 181949a6ff4bSBarry Smith @*/ 182049a6ff4bSBarry Smith PetscErrorCode MatDenseGetLDA(Mat A,PetscInt *lda) 182149a6ff4bSBarry Smith { 182249a6ff4bSBarry Smith PetscErrorCode ierr; 182349a6ff4bSBarry Smith 182449a6ff4bSBarry Smith PetscFunctionBegin; 1825d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1826d5ea218eSStefano Zampini PetscValidPointer(lda,2); 182749a6ff4bSBarry Smith ierr = PetscUseMethod(A,"MatDenseGetLDA_C",(Mat,PetscInt*),(A,lda));CHKERRQ(ierr); 182849a6ff4bSBarry Smith PetscFunctionReturn(0); 182949a6ff4bSBarry Smith } 183049a6ff4bSBarry Smith 183149a6ff4bSBarry Smith /*@C 1832*ad16ce7aSStefano Zampini MatDenseSetLDA - Sets the leading dimension of the array used by the dense matrix 1833*ad16ce7aSStefano Zampini 1834*ad16ce7aSStefano Zampini Not collective 1835*ad16ce7aSStefano Zampini 1836*ad16ce7aSStefano Zampini Input Parameter: 1837*ad16ce7aSStefano Zampini + mat - a MATSEQDENSE or MATMPIDENSE matrix 1838*ad16ce7aSStefano Zampini - lda - the leading dimension 1839*ad16ce7aSStefano Zampini 1840*ad16ce7aSStefano Zampini Level: intermediate 1841*ad16ce7aSStefano Zampini 1842*ad16ce7aSStefano Zampini .seealso: MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead(), MatDenseGetLDA() 1843*ad16ce7aSStefano Zampini @*/ 1844*ad16ce7aSStefano Zampini PetscErrorCode MatDenseSetLDA(Mat A,PetscInt lda) 1845*ad16ce7aSStefano Zampini { 1846*ad16ce7aSStefano Zampini PetscErrorCode ierr; 1847*ad16ce7aSStefano Zampini 1848*ad16ce7aSStefano Zampini PetscFunctionBegin; 1849*ad16ce7aSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1850*ad16ce7aSStefano Zampini ierr = PetscTryMethod(A,"MatDenseSetLDA_C",(Mat,PetscInt),(A,lda));CHKERRQ(ierr); 1851*ad16ce7aSStefano Zampini PetscFunctionReturn(0); 1852*ad16ce7aSStefano Zampini } 1853*ad16ce7aSStefano Zampini 1854*ad16ce7aSStefano Zampini /*@C 18556947451fSStefano Zampini MatDenseGetArray - gives read-write access to the array where the data for a dense matrix is stored 185673a71a0fSBarry Smith 18578572280aSBarry Smith Logically Collective on Mat 185873a71a0fSBarry Smith 185973a71a0fSBarry Smith Input Parameter: 18606947451fSStefano Zampini . mat - a dense matrix 186173a71a0fSBarry Smith 186273a71a0fSBarry Smith Output Parameter: 186373a71a0fSBarry Smith . array - pointer to the data 186473a71a0fSBarry Smith 186573a71a0fSBarry Smith Level: intermediate 186673a71a0fSBarry Smith 18676947451fSStefano Zampini .seealso: MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead(), MatDenseGetArrayWrite(), MatDenseRestoreArrayWrite() 186873a71a0fSBarry Smith @*/ 18698c778c55SBarry Smith PetscErrorCode MatDenseGetArray(Mat A,PetscScalar **array) 187073a71a0fSBarry Smith { 187173a71a0fSBarry Smith PetscErrorCode ierr; 187273a71a0fSBarry Smith 187373a71a0fSBarry Smith PetscFunctionBegin; 1874d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1875d5ea218eSStefano Zampini PetscValidPointer(array,2); 18768c778c55SBarry Smith ierr = PetscUseMethod(A,"MatDenseGetArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 187773a71a0fSBarry Smith PetscFunctionReturn(0); 187873a71a0fSBarry Smith } 187973a71a0fSBarry Smith 1880dec5eb66SMatthew G Knepley /*@C 1881579dbff0SBarry Smith MatDenseRestoreArray - returns access to the array where the data for a dense matrix is stored obtained by MatDenseGetArray() 188273a71a0fSBarry Smith 18838572280aSBarry Smith Logically Collective on Mat 18848572280aSBarry Smith 18858572280aSBarry Smith Input Parameters: 18866947451fSStefano Zampini + mat - a dense matrix 1887a2b725a8SWilliam Gropp - array - pointer to the data 18888572280aSBarry Smith 18898572280aSBarry Smith Level: intermediate 18908572280aSBarry Smith 18916947451fSStefano Zampini .seealso: MatDenseGetArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead(), MatDenseGetArrayWrite(), MatDenseRestoreArrayWrite() 18928572280aSBarry Smith @*/ 18938572280aSBarry Smith PetscErrorCode MatDenseRestoreArray(Mat A,PetscScalar **array) 18948572280aSBarry Smith { 18958572280aSBarry Smith PetscErrorCode ierr; 18968572280aSBarry Smith 18978572280aSBarry Smith PetscFunctionBegin; 1898d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1899d5ea218eSStefano Zampini PetscValidPointer(array,2); 19008572280aSBarry Smith ierr = PetscUseMethod(A,"MatDenseRestoreArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 19018572280aSBarry Smith ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr); 1902637a0070SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1903637a0070SStefano Zampini A->offloadmask = PETSC_OFFLOAD_CPU; 1904637a0070SStefano Zampini #endif 19058572280aSBarry Smith PetscFunctionReturn(0); 19068572280aSBarry Smith } 19078572280aSBarry Smith 19088572280aSBarry Smith /*@C 19096947451fSStefano Zampini MatDenseGetArrayRead - gives read-only access to the array where the data for a dense matrix is stored 19108572280aSBarry Smith 19118572280aSBarry Smith Not Collective 19128572280aSBarry Smith 19138572280aSBarry Smith Input Parameter: 19146947451fSStefano Zampini . mat - a dense matrix 19158572280aSBarry Smith 19168572280aSBarry Smith Output Parameter: 19178572280aSBarry Smith . array - pointer to the data 19188572280aSBarry Smith 19198572280aSBarry Smith Level: intermediate 19208572280aSBarry Smith 19216947451fSStefano Zampini .seealso: MatDenseRestoreArrayRead(), MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayWrite(), MatDenseRestoreArrayWrite() 19228572280aSBarry Smith @*/ 19238572280aSBarry Smith PetscErrorCode MatDenseGetArrayRead(Mat A,const PetscScalar **array) 19248572280aSBarry Smith { 19258572280aSBarry Smith PetscErrorCode ierr; 19268572280aSBarry Smith 19278572280aSBarry Smith PetscFunctionBegin; 1928d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1929d5ea218eSStefano Zampini PetscValidPointer(array,2); 19308572280aSBarry Smith ierr = PetscUseMethod(A,"MatDenseGetArrayRead_C",(Mat,const PetscScalar**),(A,array));CHKERRQ(ierr); 19318572280aSBarry Smith PetscFunctionReturn(0); 19328572280aSBarry Smith } 19338572280aSBarry Smith 19348572280aSBarry Smith /*@C 19356947451fSStefano Zampini MatDenseRestoreArrayRead - returns access to the array where the data for a dense matrix is stored obtained by MatDenseGetArrayRead() 19368572280aSBarry Smith 193773a71a0fSBarry Smith Not Collective 193873a71a0fSBarry Smith 193973a71a0fSBarry Smith Input Parameters: 19406947451fSStefano Zampini + mat - a dense matrix 1941a2b725a8SWilliam Gropp - array - pointer to the data 194273a71a0fSBarry Smith 194373a71a0fSBarry Smith Level: intermediate 194473a71a0fSBarry Smith 19456947451fSStefano Zampini .seealso: MatDenseGetArrayRead(), MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayWrite(), MatDenseRestoreArrayWrite() 194673a71a0fSBarry Smith @*/ 19478572280aSBarry Smith PetscErrorCode MatDenseRestoreArrayRead(Mat A,const PetscScalar **array) 194873a71a0fSBarry Smith { 194973a71a0fSBarry Smith PetscErrorCode ierr; 195073a71a0fSBarry Smith 195173a71a0fSBarry Smith PetscFunctionBegin; 1952d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1953d5ea218eSStefano Zampini PetscValidPointer(array,2); 19548572280aSBarry Smith ierr = PetscUseMethod(A,"MatDenseRestoreArrayRead_C",(Mat,const PetscScalar**),(A,array));CHKERRQ(ierr); 195573a71a0fSBarry Smith PetscFunctionReturn(0); 195673a71a0fSBarry Smith } 195773a71a0fSBarry Smith 19586947451fSStefano Zampini /*@C 19596947451fSStefano Zampini MatDenseGetArrayWrite - gives write-only access to the array where the data for a dense matrix is stored 19606947451fSStefano Zampini 19616947451fSStefano Zampini Not Collective 19626947451fSStefano Zampini 19636947451fSStefano Zampini Input Parameter: 19646947451fSStefano Zampini . mat - a dense matrix 19656947451fSStefano Zampini 19666947451fSStefano Zampini Output Parameter: 19676947451fSStefano Zampini . array - pointer to the data 19686947451fSStefano Zampini 19696947451fSStefano Zampini Level: intermediate 19706947451fSStefano Zampini 19716947451fSStefano Zampini .seealso: MatDenseRestoreArrayWrite(), MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead() 19726947451fSStefano Zampini @*/ 19736947451fSStefano Zampini PetscErrorCode MatDenseGetArrayWrite(Mat A,PetscScalar **array) 19746947451fSStefano Zampini { 19756947451fSStefano Zampini PetscErrorCode ierr; 19766947451fSStefano Zampini 19776947451fSStefano Zampini PetscFunctionBegin; 1978d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1979d5ea218eSStefano Zampini PetscValidPointer(array,2); 19806947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseGetArrayWrite_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 19816947451fSStefano Zampini PetscFunctionReturn(0); 19826947451fSStefano Zampini } 19836947451fSStefano Zampini 19846947451fSStefano Zampini /*@C 19856947451fSStefano Zampini MatDenseRestoreArrayWrite - returns access to the array where the data for a dense matrix is stored obtained by MatDenseGetArrayWrite() 19866947451fSStefano Zampini 19876947451fSStefano Zampini Not Collective 19886947451fSStefano Zampini 19896947451fSStefano Zampini Input Parameters: 19906947451fSStefano Zampini + mat - a dense matrix 19916947451fSStefano Zampini - array - pointer to the data 19926947451fSStefano Zampini 19936947451fSStefano Zampini Level: intermediate 19946947451fSStefano Zampini 19956947451fSStefano Zampini .seealso: MatDenseGetArrayWrite(), MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead() 19966947451fSStefano Zampini @*/ 19976947451fSStefano Zampini PetscErrorCode MatDenseRestoreArrayWrite(Mat A,PetscScalar **array) 19986947451fSStefano Zampini { 19996947451fSStefano Zampini PetscErrorCode ierr; 20006947451fSStefano Zampini 20016947451fSStefano Zampini PetscFunctionBegin; 2002d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 2003d5ea218eSStefano Zampini PetscValidPointer(array,2); 20046947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseRestoreArrayWrite_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 20056947451fSStefano Zampini ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr); 20066947451fSStefano Zampini #if defined(PETSC_HAVE_CUDA) 20076947451fSStefano Zampini A->offloadmask = PETSC_OFFLOAD_CPU; 20086947451fSStefano Zampini #endif 20096947451fSStefano Zampini PetscFunctionReturn(0); 20106947451fSStefano Zampini } 20116947451fSStefano Zampini 20127dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrix_SeqDense(Mat A,IS isrow,IS iscol,PetscInt cs,MatReuse scall,Mat *B) 20130754003eSLois Curfman McInnes { 2014c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 20156849ba73SBarry Smith PetscErrorCode ierr; 2016ca15aa20SStefano Zampini PetscInt i,j,nrows,ncols,blda; 20175d0c19d7SBarry Smith const PetscInt *irow,*icol; 201887828ca2SBarry Smith PetscScalar *av,*bv,*v = mat->v; 20190754003eSLois Curfman McInnes Mat newmat; 20200754003eSLois Curfman McInnes 20213a40ed3dSBarry Smith PetscFunctionBegin; 202278b31e54SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 202378b31e54SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 2024e03a110bSBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 2025e03a110bSBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 20260754003eSLois Curfman McInnes 2027182d2002SSatish Balay /* Check submatrixcall */ 2028182d2002SSatish Balay if (scall == MAT_REUSE_MATRIX) { 202913f74950SBarry Smith PetscInt n_cols,n_rows; 2030182d2002SSatish Balay ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 203121a2c019SBarry Smith if (n_rows != nrows || n_cols != ncols) { 2032f746d493SDmitry Karpeev /* resize the result matrix to match number of requested rows/columns */ 2033c61587bbSBarry Smith ierr = MatSetSizes(*B,nrows,ncols,nrows,ncols);CHKERRQ(ierr); 203421a2c019SBarry Smith } 2035182d2002SSatish Balay newmat = *B; 2036182d2002SSatish Balay } else { 20370754003eSLois Curfman McInnes /* Create and fill new matrix */ 2038ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&newmat);CHKERRQ(ierr); 2039f69a0ea3SMatthew Knepley ierr = MatSetSizes(newmat,nrows,ncols,nrows,ncols);CHKERRQ(ierr); 20407adad957SLisandro Dalcin ierr = MatSetType(newmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 20410298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(newmat,NULL);CHKERRQ(ierr); 2042182d2002SSatish Balay } 2043182d2002SSatish Balay 2044182d2002SSatish Balay /* Now extract the data pointers and do the copy,column at a time */ 2045ca15aa20SStefano Zampini ierr = MatDenseGetArray(newmat,&bv);CHKERRQ(ierr); 2046ca15aa20SStefano Zampini ierr = MatDenseGetLDA(newmat,&blda);CHKERRQ(ierr); 2047182d2002SSatish Balay for (i=0; i<ncols; i++) { 20486de62eeeSBarry Smith av = v + mat->lda*icol[i]; 2049ca15aa20SStefano Zampini for (j=0; j<nrows; j++) bv[j] = av[irow[j]]; 2050ca15aa20SStefano Zampini bv += blda; 20510754003eSLois Curfman McInnes } 2052ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(newmat,&bv);CHKERRQ(ierr); 2053182d2002SSatish Balay 2054182d2002SSatish Balay /* Assemble the matrices so that the correct flags are set */ 20556d4a8577SBarry Smith ierr = MatAssemblyBegin(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20566d4a8577SBarry Smith ierr = MatAssemblyEnd(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20570754003eSLois Curfman McInnes 20580754003eSLois Curfman McInnes /* Free work space */ 205978b31e54SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 206078b31e54SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 2061182d2002SSatish Balay *B = newmat; 20623a40ed3dSBarry Smith PetscFunctionReturn(0); 20630754003eSLois Curfman McInnes } 20640754003eSLois Curfman McInnes 20657dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrices_SeqDense(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2066905e6a2fSBarry Smith { 20676849ba73SBarry Smith PetscErrorCode ierr; 206813f74950SBarry Smith PetscInt i; 2069905e6a2fSBarry Smith 20703a40ed3dSBarry Smith PetscFunctionBegin; 2071905e6a2fSBarry Smith if (scall == MAT_INITIAL_MATRIX) { 2072df750dc8SHong Zhang ierr = PetscCalloc1(n+1,B);CHKERRQ(ierr); 2073905e6a2fSBarry Smith } 2074905e6a2fSBarry Smith 2075905e6a2fSBarry Smith for (i=0; i<n; i++) { 20767dae84e0SHong Zhang ierr = MatCreateSubMatrix_SeqDense(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 2077905e6a2fSBarry Smith } 20783a40ed3dSBarry Smith PetscFunctionReturn(0); 2079905e6a2fSBarry Smith } 2080905e6a2fSBarry Smith 2081e0877f53SBarry Smith static PetscErrorCode MatAssemblyBegin_SeqDense(Mat mat,MatAssemblyType mode) 2082c0aa2d19SHong Zhang { 2083c0aa2d19SHong Zhang PetscFunctionBegin; 2084c0aa2d19SHong Zhang PetscFunctionReturn(0); 2085c0aa2d19SHong Zhang } 2086c0aa2d19SHong Zhang 2087e0877f53SBarry Smith static PetscErrorCode MatAssemblyEnd_SeqDense(Mat mat,MatAssemblyType mode) 2088c0aa2d19SHong Zhang { 2089c0aa2d19SHong Zhang PetscFunctionBegin; 2090c0aa2d19SHong Zhang PetscFunctionReturn(0); 2091c0aa2d19SHong Zhang } 2092c0aa2d19SHong Zhang 2093e0877f53SBarry Smith static PetscErrorCode MatCopy_SeqDense(Mat A,Mat B,MatStructure str) 20944b0e389bSBarry Smith { 20954b0e389bSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data,*b = (Mat_SeqDense*)B->data; 20966849ba73SBarry Smith PetscErrorCode ierr; 2097ca15aa20SStefano Zampini const PetscScalar *va; 2098ca15aa20SStefano Zampini PetscScalar *vb; 2099d0f46423SBarry Smith PetscInt lda1=a->lda,lda2=b->lda, m=A->rmap->n,n=A->cmap->n, j; 21003a40ed3dSBarry Smith 21013a40ed3dSBarry Smith PetscFunctionBegin; 210233f4a19fSKris Buschelman /* If the two matrices don't have the same copy implementation, they aren't compatible for fast copy. */ 210333f4a19fSKris Buschelman if (A->ops->copy != B->ops->copy) { 2104cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 21053a40ed3dSBarry Smith PetscFunctionReturn(0); 21063a40ed3dSBarry Smith } 2107e32f2f54SBarry Smith if (m != B->rmap->n || n != B->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"size(B) != size(A)"); 2108ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&va);CHKERRQ(ierr); 2109ca15aa20SStefano Zampini ierr = MatDenseGetArray(B,&vb);CHKERRQ(ierr); 2110a5ce6ee0Svictorle if (lda1>m || lda2>m) { 21110dbb7854Svictorle for (j=0; j<n; j++) { 2112ca15aa20SStefano Zampini ierr = PetscArraycpy(vb+j*lda2,va+j*lda1,m);CHKERRQ(ierr); 2113a5ce6ee0Svictorle } 2114a5ce6ee0Svictorle } else { 2115ca15aa20SStefano Zampini ierr = PetscArraycpy(vb,va,A->rmap->n*A->cmap->n);CHKERRQ(ierr); 2116a5ce6ee0Svictorle } 2117ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(B,&vb);CHKERRQ(ierr); 2118ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&va);CHKERRQ(ierr); 2119ca15aa20SStefano Zampini ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2120ca15aa20SStefano Zampini ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2121273d9f13SBarry Smith PetscFunctionReturn(0); 2122273d9f13SBarry Smith } 2123273d9f13SBarry Smith 2124e0877f53SBarry Smith static PetscErrorCode MatSetUp_SeqDense(Mat A) 2125273d9f13SBarry Smith { 2126dfbe8321SBarry Smith PetscErrorCode ierr; 2127273d9f13SBarry Smith 2128273d9f13SBarry Smith PetscFunctionBegin; 212918992e5dSStefano Zampini ierr = PetscLayoutSetUp(A->rmap);CHKERRQ(ierr); 213018992e5dSStefano Zampini ierr = PetscLayoutSetUp(A->cmap);CHKERRQ(ierr); 213118992e5dSStefano Zampini if (!A->preallocated) { 2132273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(A,0);CHKERRQ(ierr); 213318992e5dSStefano Zampini } 21343a40ed3dSBarry Smith PetscFunctionReturn(0); 21354b0e389bSBarry Smith } 21364b0e389bSBarry Smith 2137ba337c44SJed Brown static PetscErrorCode MatConjugate_SeqDense(Mat A) 2138ba337c44SJed Brown { 2139ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 2140ca15aa20SStefano Zampini PetscScalar *aa; 2141ca15aa20SStefano Zampini PetscErrorCode ierr; 2142ba337c44SJed Brown 2143ba337c44SJed Brown PetscFunctionBegin; 2144ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&aa);CHKERRQ(ierr); 2145ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscConj(aa[i]); 2146ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&aa);CHKERRQ(ierr); 2147ba337c44SJed Brown PetscFunctionReturn(0); 2148ba337c44SJed Brown } 2149ba337c44SJed Brown 2150ba337c44SJed Brown static PetscErrorCode MatRealPart_SeqDense(Mat A) 2151ba337c44SJed Brown { 2152ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 2153ca15aa20SStefano Zampini PetscScalar *aa; 2154ca15aa20SStefano Zampini PetscErrorCode ierr; 2155ba337c44SJed Brown 2156ba337c44SJed Brown PetscFunctionBegin; 2157ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&aa);CHKERRQ(ierr); 2158ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 2159ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&aa);CHKERRQ(ierr); 2160ba337c44SJed Brown PetscFunctionReturn(0); 2161ba337c44SJed Brown } 2162ba337c44SJed Brown 2163ba337c44SJed Brown static PetscErrorCode MatImaginaryPart_SeqDense(Mat A) 2164ba337c44SJed Brown { 2165ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 2166ca15aa20SStefano Zampini PetscScalar *aa; 2167ca15aa20SStefano Zampini PetscErrorCode ierr; 2168ba337c44SJed Brown 2169ba337c44SJed Brown PetscFunctionBegin; 2170ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&aa);CHKERRQ(ierr); 2171ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 2172ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&aa);CHKERRQ(ierr); 2173ba337c44SJed Brown PetscFunctionReturn(0); 2174ba337c44SJed Brown } 2175284134d9SBarry Smith 2176a9fe9ddaSSatish Balay /* ----------------------------------------------------------------*/ 21774222ddf1SHong Zhang PetscErrorCode MatMatMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat C) 2178a9fe9ddaSSatish Balay { 2179ee16a9a1SHong Zhang PetscErrorCode ierr; 2180d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 21817a3c3d58SStefano Zampini PetscBool cisdense; 2182a9fe9ddaSSatish Balay 2183ee16a9a1SHong Zhang PetscFunctionBegin; 21844222ddf1SHong Zhang ierr = MatSetSizes(C,m,n,m,n);CHKERRQ(ierr); 21857a3c3d58SStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 21867a3c3d58SStefano Zampini if (!cisdense) { 21877a3c3d58SStefano Zampini PetscBool flg; 21887a3c3d58SStefano Zampini 2189ca15aa20SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)B,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 21904222ddf1SHong Zhang ierr = MatSetType(C,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 21917a3c3d58SStefano Zampini } 219218992e5dSStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 2193ee16a9a1SHong Zhang PetscFunctionReturn(0); 2194ee16a9a1SHong Zhang } 2195a9fe9ddaSSatish Balay 2196a9fe9ddaSSatish Balay PetscErrorCode MatMatMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 2197a9fe9ddaSSatish Balay { 219852c5f739Sprj- Mat_SeqDense *a,*b=(Mat_SeqDense*)B->data,*c=(Mat_SeqDense*)C->data; 21990805154bSBarry Smith PetscBLASInt m,n,k; 2200ca15aa20SStefano Zampini const PetscScalar *av,*bv; 2201ca15aa20SStefano Zampini PetscScalar *cv; 2202a9fe9ddaSSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 2203fd4e9aacSBarry Smith PetscBool flg; 2204c2916339SPierre Jolivet PetscErrorCode (*numeric)(Mat,Mat,Mat)=NULL; 2205c2916339SPierre Jolivet PetscErrorCode ierr; 2206a9fe9ddaSSatish Balay 2207a9fe9ddaSSatish Balay PetscFunctionBegin; 2208fd4e9aacSBarry Smith /* Handle case where where user provided the final C matrix rather than calling MatMatMult() with MAT_INITIAL_MATRIX*/ 2209fd4e9aacSBarry Smith ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&flg);CHKERRQ(ierr); 2210c2916339SPierre Jolivet if (flg) numeric = MatMatMultNumeric_SeqAIJ_SeqDense; 2211a001520aSPierre Jolivet ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&flg);CHKERRQ(ierr); 2212c2916339SPierre Jolivet if (flg) numeric = MatMatMultNumeric_SeqBAIJ_SeqDense; 2213c2916339SPierre Jolivet ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&flg);CHKERRQ(ierr); 2214c2916339SPierre Jolivet if (flg) numeric = MatMatMultNumeric_SeqSBAIJ_SeqDense; 221552c5f739Sprj- ierr = PetscObjectTypeCompare((PetscObject)A,MATNEST,&flg);CHKERRQ(ierr); 2216c2916339SPierre Jolivet if (flg) numeric = MatMatMultNumeric_Nest_Dense; 2217c2916339SPierre Jolivet if (numeric) { 2218c2916339SPierre Jolivet C->ops->matmultnumeric = numeric; 2219c2916339SPierre Jolivet ierr = (*numeric)(A,B,C);CHKERRQ(ierr); 222052c5f739Sprj- PetscFunctionReturn(0); 222152c5f739Sprj- } 222252c5f739Sprj- a = (Mat_SeqDense*)A->data; 22238208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->rmap->n,&m);CHKERRQ(ierr); 22248208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->cmap->n,&n);CHKERRQ(ierr); 2225c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&k);CHKERRQ(ierr); 222649d0e964SStefano Zampini if (!m || !n || !k) PetscFunctionReturn(0); 2227ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&av);CHKERRQ(ierr); 2228ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(B,&bv);CHKERRQ(ierr); 2229ca15aa20SStefano Zampini ierr = MatDenseGetArray(C,&cv);CHKERRQ(ierr); 2230ca15aa20SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("N","N",&m,&n,&k,&_DOne,av,&a->lda,bv,&b->lda,&_DZero,cv,&c->lda)); 2231ca15aa20SStefano Zampini ierr = PetscLogFlops(1.0*m*n*k + 1.0*m*n*(k-1));CHKERRQ(ierr); 2232ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&av);CHKERRQ(ierr); 2233ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(B,&bv);CHKERRQ(ierr); 2234ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(C,&cv);CHKERRQ(ierr); 2235a9fe9ddaSSatish Balay PetscFunctionReturn(0); 2236a9fe9ddaSSatish Balay } 2237a9fe9ddaSSatish Balay 22384222ddf1SHong Zhang PetscErrorCode MatMatTransposeMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat C) 223969f65d41SStefano Zampini { 224069f65d41SStefano Zampini PetscErrorCode ierr; 224169f65d41SStefano Zampini PetscInt m=A->rmap->n,n=B->rmap->n; 22427a3c3d58SStefano Zampini PetscBool cisdense; 224369f65d41SStefano Zampini 224469f65d41SStefano Zampini PetscFunctionBegin; 22454222ddf1SHong Zhang ierr = MatSetSizes(C,m,n,m,n);CHKERRQ(ierr); 22467a3c3d58SStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 22477a3c3d58SStefano Zampini if (!cisdense) { 22487a3c3d58SStefano Zampini PetscBool flg; 22497a3c3d58SStefano Zampini 2250ca15aa20SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)B,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 22514222ddf1SHong Zhang ierr = MatSetType(C,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 22527a3c3d58SStefano Zampini } 225318992e5dSStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 225469f65d41SStefano Zampini PetscFunctionReturn(0); 225569f65d41SStefano Zampini } 225669f65d41SStefano Zampini 225769f65d41SStefano Zampini PetscErrorCode MatMatTransposeMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 225869f65d41SStefano Zampini { 225969f65d41SStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 226069f65d41SStefano Zampini Mat_SeqDense *b = (Mat_SeqDense*)B->data; 226169f65d41SStefano Zampini Mat_SeqDense *c = (Mat_SeqDense*)C->data; 226269f65d41SStefano Zampini PetscBLASInt m,n,k; 226369f65d41SStefano Zampini PetscScalar _DOne=1.0,_DZero=0.0; 226469f65d41SStefano Zampini PetscErrorCode ierr; 226569f65d41SStefano Zampini 226669f65d41SStefano Zampini PetscFunctionBegin; 226749d0e964SStefano Zampini ierr = PetscBLASIntCast(C->rmap->n,&m);CHKERRQ(ierr); 226849d0e964SStefano Zampini ierr = PetscBLASIntCast(C->cmap->n,&n);CHKERRQ(ierr); 226969f65d41SStefano Zampini ierr = PetscBLASIntCast(A->cmap->n,&k);CHKERRQ(ierr); 227049d0e964SStefano Zampini if (!m || !n || !k) PetscFunctionReturn(0); 227169f65d41SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("N","T",&m,&n,&k,&_DOne,a->v,&a->lda,b->v,&b->lda,&_DZero,c->v,&c->lda)); 2272ca15aa20SStefano Zampini ierr = PetscLogFlops(1.0*m*n*k + 1.0*m*n*(k-1));CHKERRQ(ierr); 227369f65d41SStefano Zampini PetscFunctionReturn(0); 227469f65d41SStefano Zampini } 227569f65d41SStefano Zampini 22764222ddf1SHong Zhang PetscErrorCode MatTransposeMatMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat C) 2277a9fe9ddaSSatish Balay { 2278ee16a9a1SHong Zhang PetscErrorCode ierr; 2279d0f46423SBarry Smith PetscInt m=A->cmap->n,n=B->cmap->n; 22807a3c3d58SStefano Zampini PetscBool cisdense; 2281a9fe9ddaSSatish Balay 2282ee16a9a1SHong Zhang PetscFunctionBegin; 22834222ddf1SHong Zhang ierr = MatSetSizes(C,m,n,m,n);CHKERRQ(ierr); 22847a3c3d58SStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 22857a3c3d58SStefano Zampini if (!cisdense) { 22867a3c3d58SStefano Zampini PetscBool flg; 22877a3c3d58SStefano Zampini 2288ca15aa20SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)B,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 22894222ddf1SHong Zhang ierr = MatSetType(C,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 22907a3c3d58SStefano Zampini } 229118992e5dSStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 2292ee16a9a1SHong Zhang PetscFunctionReturn(0); 2293ee16a9a1SHong Zhang } 2294a9fe9ddaSSatish Balay 229575648e8dSHong Zhang PetscErrorCode MatTransposeMatMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 2296a9fe9ddaSSatish Balay { 2297a9fe9ddaSSatish Balay Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2298a9fe9ddaSSatish Balay Mat_SeqDense *b = (Mat_SeqDense*)B->data; 2299a9fe9ddaSSatish Balay Mat_SeqDense *c = (Mat_SeqDense*)C->data; 23000805154bSBarry Smith PetscBLASInt m,n,k; 2301a9fe9ddaSSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 2302c5df96a5SBarry Smith PetscErrorCode ierr; 2303a9fe9ddaSSatish Balay 2304a9fe9ddaSSatish Balay PetscFunctionBegin; 23058208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->rmap->n,&m);CHKERRQ(ierr); 23068208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->cmap->n,&n);CHKERRQ(ierr); 2307c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&k);CHKERRQ(ierr); 230849d0e964SStefano Zampini if (!m || !n || !k) PetscFunctionReturn(0); 23095ca1cc5dSStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("T","N",&m,&n,&k,&_DOne,a->v,&a->lda,b->v,&b->lda,&_DZero,c->v,&c->lda)); 2310ca15aa20SStefano Zampini ierr = PetscLogFlops(1.0*m*n*k + 1.0*m*n*(k-1));CHKERRQ(ierr); 2311a9fe9ddaSSatish Balay PetscFunctionReturn(0); 2312a9fe9ddaSSatish Balay } 2313985db425SBarry Smith 23144222ddf1SHong Zhang /* ----------------------------------------------- */ 23154222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_SeqDense_AB(Mat C) 23164222ddf1SHong Zhang { 23174222ddf1SHong Zhang PetscFunctionBegin; 23184222ddf1SHong Zhang C->ops->matmultsymbolic = MatMatMultSymbolic_SeqDense_SeqDense; 23194222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_AB; 23204222ddf1SHong Zhang /* dense mat may not call MatProductSymbolic(), thus set C->ops->productnumeric here */ 23214222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AB; 23224222ddf1SHong Zhang PetscFunctionReturn(0); 23234222ddf1SHong Zhang } 23244222ddf1SHong Zhang 23254222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_SeqDense_AtB(Mat C) 23264222ddf1SHong Zhang { 23274222ddf1SHong Zhang PetscFunctionBegin; 23284222ddf1SHong Zhang C->ops->transposematmultsymbolic = MatTransposeMatMultSymbolic_SeqDense_SeqDense; 23294222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_AtB; 23304222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AtB; 23314222ddf1SHong Zhang PetscFunctionReturn(0); 23324222ddf1SHong Zhang } 23334222ddf1SHong Zhang 23344222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_SeqDense_ABt(Mat C) 23354222ddf1SHong Zhang { 23364222ddf1SHong Zhang PetscFunctionBegin; 23374222ddf1SHong Zhang C->ops->mattransposemultsymbolic = MatMatTransposeMultSymbolic_SeqDense_SeqDense; 23384222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_ABt; 23394222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_ABt; 23404222ddf1SHong Zhang PetscFunctionReturn(0); 23414222ddf1SHong Zhang } 23424222ddf1SHong Zhang 23434222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_SeqDense_PtAP(Mat C) 23444222ddf1SHong Zhang { 23454222ddf1SHong Zhang PetscFunctionBegin; 23464222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_Basic; 23474222ddf1SHong Zhang PetscFunctionReturn(0); 23484222ddf1SHong Zhang } 23494222ddf1SHong Zhang 23504222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_SeqDense(Mat C) 23514222ddf1SHong Zhang { 23524222ddf1SHong Zhang PetscErrorCode ierr; 23534222ddf1SHong Zhang Mat_Product *product = C->product; 23544222ddf1SHong Zhang 23554222ddf1SHong Zhang PetscFunctionBegin; 23564222ddf1SHong Zhang switch (product->type) { 23574222ddf1SHong Zhang case MATPRODUCT_AB: 23584222ddf1SHong Zhang ierr = MatProductSetFromOptions_SeqDense_AB(C);CHKERRQ(ierr); 23594222ddf1SHong Zhang break; 23604222ddf1SHong Zhang case MATPRODUCT_AtB: 23614222ddf1SHong Zhang ierr = MatProductSetFromOptions_SeqDense_AtB(C);CHKERRQ(ierr); 23624222ddf1SHong Zhang break; 23634222ddf1SHong Zhang case MATPRODUCT_ABt: 23644222ddf1SHong Zhang ierr = MatProductSetFromOptions_SeqDense_ABt(C);CHKERRQ(ierr); 23654222ddf1SHong Zhang break; 23664222ddf1SHong Zhang case MATPRODUCT_PtAP: 23675aae2c7aSStefano Zampini case MATPRODUCT_RARt: 23684222ddf1SHong Zhang ierr = MatProductSetFromOptions_SeqDense_PtAP(C);CHKERRQ(ierr); 23694222ddf1SHong Zhang break; 2370544a5e07SHong Zhang default: SETERRQ1(PetscObjectComm((PetscObject)C),PETSC_ERR_SUP,"MatProduct type %s is not supported for SeqDense and SeqDense matrices",MatProductTypes[product->type]); 23714222ddf1SHong Zhang } 23724222ddf1SHong Zhang PetscFunctionReturn(0); 23734222ddf1SHong Zhang } 23744222ddf1SHong Zhang /* ----------------------------------------------- */ 23754222ddf1SHong Zhang 2376e0877f53SBarry Smith static PetscErrorCode MatGetRowMax_SeqDense(Mat A,Vec v,PetscInt idx[]) 2377985db425SBarry Smith { 2378985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2379985db425SBarry Smith PetscErrorCode ierr; 2380d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 2381985db425SBarry Smith PetscScalar *x; 2382ca15aa20SStefano Zampini const PetscScalar *aa; 2383985db425SBarry Smith 2384985db425SBarry Smith PetscFunctionBegin; 2385e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2386985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2387985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 2388ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 2389e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2390985db425SBarry Smith for (i=0; i<m; i++) { 2391985db425SBarry Smith x[i] = aa[i]; if (idx) idx[i] = 0; 2392985db425SBarry Smith for (j=1; j<n; j++) { 2393ca15aa20SStefano Zampini if (PetscRealPart(x[i]) < PetscRealPart(aa[i+a->lda*j])) {x[i] = aa[i + a->lda*j]; if (idx) idx[i] = j;} 2394985db425SBarry Smith } 2395985db425SBarry Smith } 2396ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 2397985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2398985db425SBarry Smith PetscFunctionReturn(0); 2399985db425SBarry Smith } 2400985db425SBarry Smith 2401e0877f53SBarry Smith static PetscErrorCode MatGetRowMaxAbs_SeqDense(Mat A,Vec v,PetscInt idx[]) 2402985db425SBarry Smith { 2403985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2404985db425SBarry Smith PetscErrorCode ierr; 2405d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 2406985db425SBarry Smith PetscScalar *x; 2407985db425SBarry Smith PetscReal atmp; 2408ca15aa20SStefano Zampini const PetscScalar *aa; 2409985db425SBarry Smith 2410985db425SBarry Smith PetscFunctionBegin; 2411e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2412985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2413985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 2414ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 2415e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2416985db425SBarry Smith for (i=0; i<m; i++) { 24179189402eSHong Zhang x[i] = PetscAbsScalar(aa[i]); 2418985db425SBarry Smith for (j=1; j<n; j++) { 2419ca15aa20SStefano Zampini atmp = PetscAbsScalar(aa[i+a->lda*j]); 2420985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = j;} 2421985db425SBarry Smith } 2422985db425SBarry Smith } 2423ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 2424985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2425985db425SBarry Smith PetscFunctionReturn(0); 2426985db425SBarry Smith } 2427985db425SBarry Smith 2428e0877f53SBarry Smith static PetscErrorCode MatGetRowMin_SeqDense(Mat A,Vec v,PetscInt idx[]) 2429985db425SBarry Smith { 2430985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2431985db425SBarry Smith PetscErrorCode ierr; 2432d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 2433985db425SBarry Smith PetscScalar *x; 2434ca15aa20SStefano Zampini const PetscScalar *aa; 2435985db425SBarry Smith 2436985db425SBarry Smith PetscFunctionBegin; 2437e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2438ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 2439985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2440985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 2441e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2442985db425SBarry Smith for (i=0; i<m; i++) { 2443985db425SBarry Smith x[i] = aa[i]; if (idx) idx[i] = 0; 2444985db425SBarry Smith for (j=1; j<n; j++) { 2445ca15aa20SStefano Zampini if (PetscRealPart(x[i]) > PetscRealPart(aa[i+a->lda*j])) {x[i] = aa[i + a->lda*j]; if (idx) idx[i] = j;} 2446985db425SBarry Smith } 2447985db425SBarry Smith } 2448985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2449ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 2450985db425SBarry Smith PetscFunctionReturn(0); 2451985db425SBarry Smith } 2452985db425SBarry Smith 2453637a0070SStefano Zampini PetscErrorCode MatGetColumnVector_SeqDense(Mat A,Vec v,PetscInt col) 24548d0534beSBarry Smith { 24558d0534beSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 24568d0534beSBarry Smith PetscErrorCode ierr; 24578d0534beSBarry Smith PetscScalar *x; 2458ca15aa20SStefano Zampini const PetscScalar *aa; 24598d0534beSBarry Smith 24608d0534beSBarry Smith PetscFunctionBegin; 2461e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2462ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 24638d0534beSBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2464ca15aa20SStefano Zampini ierr = PetscArraycpy(x,aa+col*a->lda,A->rmap->n);CHKERRQ(ierr); 24658d0534beSBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2466ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 24678d0534beSBarry Smith PetscFunctionReturn(0); 24688d0534beSBarry Smith } 24698d0534beSBarry Smith 247052c5f739Sprj- PETSC_INTERN PetscErrorCode MatGetColumnNorms_SeqDense(Mat A,NormType type,PetscReal *norms) 24710716a85fSBarry Smith { 24720716a85fSBarry Smith PetscErrorCode ierr; 24730716a85fSBarry Smith PetscInt i,j,m,n; 24741683a169SBarry Smith const PetscScalar *a; 24750716a85fSBarry Smith 24760716a85fSBarry Smith PetscFunctionBegin; 24770716a85fSBarry Smith ierr = MatGetSize(A,&m,&n);CHKERRQ(ierr); 2478580bdb30SBarry Smith ierr = PetscArrayzero(norms,n);CHKERRQ(ierr); 24791683a169SBarry Smith ierr = MatDenseGetArrayRead(A,&a);CHKERRQ(ierr); 24800716a85fSBarry Smith if (type == NORM_2) { 24810716a85fSBarry Smith for (i=0; i<n; i++) { 24820716a85fSBarry Smith for (j=0; j<m; j++) { 24830716a85fSBarry Smith norms[i] += PetscAbsScalar(a[j]*a[j]); 24840716a85fSBarry Smith } 24850716a85fSBarry Smith a += m; 24860716a85fSBarry Smith } 24870716a85fSBarry Smith } else if (type == NORM_1) { 24880716a85fSBarry Smith for (i=0; i<n; i++) { 24890716a85fSBarry Smith for (j=0; j<m; j++) { 24900716a85fSBarry Smith norms[i] += PetscAbsScalar(a[j]); 24910716a85fSBarry Smith } 24920716a85fSBarry Smith a += m; 24930716a85fSBarry Smith } 24940716a85fSBarry Smith } else if (type == NORM_INFINITY) { 24950716a85fSBarry Smith for (i=0; i<n; i++) { 24960716a85fSBarry Smith for (j=0; j<m; j++) { 24970716a85fSBarry Smith norms[i] = PetscMax(PetscAbsScalar(a[j]),norms[i]); 24980716a85fSBarry Smith } 24990716a85fSBarry Smith a += m; 25000716a85fSBarry Smith } 2501ce94432eSBarry Smith } else SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Unknown NormType"); 25021683a169SBarry Smith ierr = MatDenseRestoreArrayRead(A,&a);CHKERRQ(ierr); 25030716a85fSBarry Smith if (type == NORM_2) { 25048f1a2a5eSBarry Smith for (i=0; i<n; i++) norms[i] = PetscSqrtReal(norms[i]); 25050716a85fSBarry Smith } 25060716a85fSBarry Smith PetscFunctionReturn(0); 25070716a85fSBarry Smith } 25080716a85fSBarry Smith 250973a71a0fSBarry Smith static PetscErrorCode MatSetRandom_SeqDense(Mat x,PetscRandom rctx) 251073a71a0fSBarry Smith { 251173a71a0fSBarry Smith PetscErrorCode ierr; 251273a71a0fSBarry Smith PetscScalar *a; 2513637a0070SStefano Zampini PetscInt lda,m,n,i,j; 251473a71a0fSBarry Smith 251573a71a0fSBarry Smith PetscFunctionBegin; 251673a71a0fSBarry Smith ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr); 2517637a0070SStefano Zampini ierr = MatDenseGetLDA(x,&lda);CHKERRQ(ierr); 25188c778c55SBarry Smith ierr = MatDenseGetArray(x,&a);CHKERRQ(ierr); 2519637a0070SStefano Zampini for (j=0; j<n; j++) { 2520637a0070SStefano Zampini for (i=0; i<m; i++) { 2521637a0070SStefano Zampini ierr = PetscRandomGetValue(rctx,a+j*lda+i);CHKERRQ(ierr); 2522637a0070SStefano Zampini } 252373a71a0fSBarry Smith } 25248c778c55SBarry Smith ierr = MatDenseRestoreArray(x,&a);CHKERRQ(ierr); 252573a71a0fSBarry Smith PetscFunctionReturn(0); 252673a71a0fSBarry Smith } 252773a71a0fSBarry Smith 25283b49f96aSBarry Smith static PetscErrorCode MatMissingDiagonal_SeqDense(Mat A,PetscBool *missing,PetscInt *d) 25293b49f96aSBarry Smith { 25303b49f96aSBarry Smith PetscFunctionBegin; 25313b49f96aSBarry Smith *missing = PETSC_FALSE; 25323b49f96aSBarry Smith PetscFunctionReturn(0); 25333b49f96aSBarry Smith } 253473a71a0fSBarry Smith 2535ca15aa20SStefano Zampini /* vals is not const */ 2536af53bab2SHong Zhang static PetscErrorCode MatDenseGetColumn_SeqDense(Mat A,PetscInt col,PetscScalar **vals) 253786aefd0dSHong Zhang { 2538ca15aa20SStefano Zampini PetscErrorCode ierr; 253986aefd0dSHong Zhang Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2540ca15aa20SStefano Zampini PetscScalar *v; 254186aefd0dSHong Zhang 254286aefd0dSHong Zhang PetscFunctionBegin; 254386aefd0dSHong Zhang if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2544ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 2545ca15aa20SStefano Zampini *vals = v+col*a->lda; 2546ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 254786aefd0dSHong Zhang PetscFunctionReturn(0); 254886aefd0dSHong Zhang } 254986aefd0dSHong Zhang 2550af53bab2SHong Zhang static PetscErrorCode MatDenseRestoreColumn_SeqDense(Mat A,PetscScalar **vals) 255186aefd0dSHong Zhang { 255286aefd0dSHong Zhang PetscFunctionBegin; 255386aefd0dSHong Zhang *vals = 0; /* user cannot accidently use the array later */ 255486aefd0dSHong Zhang PetscFunctionReturn(0); 255586aefd0dSHong Zhang } 2556abc3b08eSStefano Zampini 2557289bc588SBarry Smith /* -------------------------------------------------------------------*/ 2558a5ae1ecdSBarry Smith static struct _MatOps MatOps_Values = { MatSetValues_SeqDense, 2559905e6a2fSBarry Smith MatGetRow_SeqDense, 2560905e6a2fSBarry Smith MatRestoreRow_SeqDense, 2561905e6a2fSBarry Smith MatMult_SeqDense, 256297304618SKris Buschelman /* 4*/ MatMultAdd_SeqDense, 25637c922b88SBarry Smith MatMultTranspose_SeqDense, 25647c922b88SBarry Smith MatMultTransposeAdd_SeqDense, 2565db4efbfdSBarry Smith 0, 2566db4efbfdSBarry Smith 0, 2567db4efbfdSBarry Smith 0, 2568db4efbfdSBarry Smith /* 10*/ 0, 2569905e6a2fSBarry Smith MatLUFactor_SeqDense, 2570905e6a2fSBarry Smith MatCholeskyFactor_SeqDense, 257141f059aeSBarry Smith MatSOR_SeqDense, 2572ec8511deSBarry Smith MatTranspose_SeqDense, 257397304618SKris Buschelman /* 15*/ MatGetInfo_SeqDense, 2574905e6a2fSBarry Smith MatEqual_SeqDense, 2575905e6a2fSBarry Smith MatGetDiagonal_SeqDense, 2576905e6a2fSBarry Smith MatDiagonalScale_SeqDense, 2577905e6a2fSBarry Smith MatNorm_SeqDense, 2578c0aa2d19SHong Zhang /* 20*/ MatAssemblyBegin_SeqDense, 2579c0aa2d19SHong Zhang MatAssemblyEnd_SeqDense, 2580905e6a2fSBarry Smith MatSetOption_SeqDense, 2581905e6a2fSBarry Smith MatZeroEntries_SeqDense, 2582d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqDense, 2583db4efbfdSBarry Smith 0, 2584db4efbfdSBarry Smith 0, 2585db4efbfdSBarry Smith 0, 2586db4efbfdSBarry Smith 0, 25874994cf47SJed Brown /* 29*/ MatSetUp_SeqDense, 2588273d9f13SBarry Smith 0, 2589905e6a2fSBarry Smith 0, 259073a71a0fSBarry Smith 0, 259173a71a0fSBarry Smith 0, 2592d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqDense, 2593a5ae1ecdSBarry Smith 0, 2594a5ae1ecdSBarry Smith 0, 2595a5ae1ecdSBarry Smith 0, 2596a5ae1ecdSBarry Smith 0, 2597d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqDense, 25987dae84e0SHong Zhang MatCreateSubMatrices_SeqDense, 2599a5ae1ecdSBarry Smith 0, 26004b0e389bSBarry Smith MatGetValues_SeqDense, 2601a5ae1ecdSBarry Smith MatCopy_SeqDense, 2602d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqDense, 2603a5ae1ecdSBarry Smith MatScale_SeqDense, 26047d68702bSBarry Smith MatShift_Basic, 2605a5ae1ecdSBarry Smith 0, 26063f49a652SStefano Zampini MatZeroRowsColumns_SeqDense, 260773a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqDense, 2608a5ae1ecdSBarry Smith 0, 2609a5ae1ecdSBarry Smith 0, 2610a5ae1ecdSBarry Smith 0, 2611a5ae1ecdSBarry Smith 0, 2612d519adbfSMatthew Knepley /* 54*/ 0, 2613a5ae1ecdSBarry Smith 0, 2614a5ae1ecdSBarry Smith 0, 2615a5ae1ecdSBarry Smith 0, 2616a5ae1ecdSBarry Smith 0, 2617d519adbfSMatthew Knepley /* 59*/ 0, 2618e03a110bSBarry Smith MatDestroy_SeqDense, 2619e03a110bSBarry Smith MatView_SeqDense, 2620357abbc8SBarry Smith 0, 262197304618SKris Buschelman 0, 2622d519adbfSMatthew Knepley /* 64*/ 0, 262397304618SKris Buschelman 0, 262497304618SKris Buschelman 0, 262597304618SKris Buschelman 0, 262697304618SKris Buschelman 0, 2627d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqDense, 262897304618SKris Buschelman 0, 262997304618SKris Buschelman 0, 263097304618SKris Buschelman 0, 263197304618SKris Buschelman 0, 2632d519adbfSMatthew Knepley /* 74*/ 0, 263397304618SKris Buschelman 0, 263497304618SKris Buschelman 0, 263597304618SKris Buschelman 0, 263697304618SKris Buschelman 0, 2637d519adbfSMatthew Knepley /* 79*/ 0, 263897304618SKris Buschelman 0, 263997304618SKris Buschelman 0, 264097304618SKris Buschelman 0, 26415bba2384SShri Abhyankar /* 83*/ MatLoad_SeqDense, 2642637a0070SStefano Zampini MatIsSymmetric_SeqDense, 26431cbb95d3SBarry Smith MatIsHermitian_SeqDense, 2644865e5f61SKris Buschelman 0, 2645865e5f61SKris Buschelman 0, 2646865e5f61SKris Buschelman 0, 26474222ddf1SHong Zhang /* 89*/ 0, 26484222ddf1SHong Zhang 0, 2649a9fe9ddaSSatish Balay MatMatMultNumeric_SeqDense_SeqDense, 26504222ddf1SHong Zhang 0, 26514222ddf1SHong Zhang 0, 26524222ddf1SHong Zhang /* 94*/ 0, 26534222ddf1SHong Zhang 0, 26544222ddf1SHong Zhang 0, 265569f65d41SStefano Zampini MatMatTransposeMultNumeric_SeqDense_SeqDense, 2656284134d9SBarry Smith 0, 26574222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqDense, 2658284134d9SBarry Smith 0, 2659284134d9SBarry Smith 0, 2660ba337c44SJed Brown MatConjugate_SeqDense, 2661f73d5cc4SBarry Smith 0, 2662ba337c44SJed Brown /*104*/ 0, 2663ba337c44SJed Brown MatRealPart_SeqDense, 2664ba337c44SJed Brown MatImaginaryPart_SeqDense, 2665985db425SBarry Smith 0, 2666985db425SBarry Smith 0, 26678208b9aeSStefano Zampini /*109*/ 0, 2668985db425SBarry Smith 0, 26698d0534beSBarry Smith MatGetRowMin_SeqDense, 2670aabbc4fbSShri Abhyankar MatGetColumnVector_SeqDense, 26713b49f96aSBarry Smith MatMissingDiagonal_SeqDense, 2672aabbc4fbSShri Abhyankar /*114*/ 0, 2673aabbc4fbSShri Abhyankar 0, 2674aabbc4fbSShri Abhyankar 0, 2675aabbc4fbSShri Abhyankar 0, 2676aabbc4fbSShri Abhyankar 0, 2677aabbc4fbSShri Abhyankar /*119*/ 0, 2678aabbc4fbSShri Abhyankar 0, 2679aabbc4fbSShri Abhyankar 0, 26800716a85fSBarry Smith 0, 26810716a85fSBarry Smith 0, 26820716a85fSBarry Smith /*124*/ 0, 26835df89d91SHong Zhang MatGetColumnNorms_SeqDense, 26845df89d91SHong Zhang 0, 26855df89d91SHong Zhang 0, 26865df89d91SHong Zhang 0, 26875df89d91SHong Zhang /*129*/ 0, 26884222ddf1SHong Zhang 0, 26894222ddf1SHong Zhang 0, 269075648e8dSHong Zhang MatTransposeMatMultNumeric_SeqDense_SeqDense, 26913964eb88SJed Brown 0, 26923964eb88SJed Brown /*134*/ 0, 26933964eb88SJed Brown 0, 26943964eb88SJed Brown 0, 26953964eb88SJed Brown 0, 26963964eb88SJed Brown 0, 26973964eb88SJed Brown /*139*/ 0, 2698f9426fe0SMark Adams 0, 2699d528f656SJakub Kruzik 0, 2700d528f656SJakub Kruzik 0, 2701d528f656SJakub Kruzik 0, 27024222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqDense, 27034222ddf1SHong Zhang /*145*/ 0, 27044222ddf1SHong Zhang 0, 27054222ddf1SHong Zhang 0 2706985db425SBarry Smith }; 270790ace30eSBarry Smith 27084b828684SBarry Smith /*@C 2709fafbff53SBarry Smith MatCreateSeqDense - Creates a sequential dense matrix that 2710d65003e9SLois Curfman McInnes is stored in column major order (the usual Fortran 77 manner). Many 2711d65003e9SLois Curfman McInnes of the matrix operations use the BLAS and LAPACK routines. 2712289bc588SBarry Smith 2713d083f849SBarry Smith Collective 2714db81eaa0SLois Curfman McInnes 271520563c6bSBarry Smith Input Parameters: 2716db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 27170c775827SLois Curfman McInnes . m - number of rows 271818f449edSLois Curfman McInnes . n - number of columns 27190298fd71SBarry Smith - data - optional location of matrix data in column major order. Set data=NULL for PETSc 2720dfc5480cSLois Curfman McInnes to control all matrix memory allocation. 272120563c6bSBarry Smith 272220563c6bSBarry Smith Output Parameter: 272344cd7ae7SLois Curfman McInnes . A - the matrix 272420563c6bSBarry Smith 2725b259b22eSLois Curfman McInnes Notes: 272618f449edSLois Curfman McInnes The data input variable is intended primarily for Fortran programmers 272718f449edSLois Curfman McInnes who wish to allocate their own matrix memory space. Most users should 27280298fd71SBarry Smith set data=NULL. 272918f449edSLois Curfman McInnes 2730027ccd11SLois Curfman McInnes Level: intermediate 2731027ccd11SLois Curfman McInnes 273269b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateDense(), MatSetValues() 273320563c6bSBarry Smith @*/ 27347087cfbeSBarry Smith PetscErrorCode MatCreateSeqDense(MPI_Comm comm,PetscInt m,PetscInt n,PetscScalar *data,Mat *A) 2735289bc588SBarry Smith { 2736dfbe8321SBarry Smith PetscErrorCode ierr; 27373b2fbd54SBarry Smith 27383a40ed3dSBarry Smith PetscFunctionBegin; 2739f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 2740f69a0ea3SMatthew Knepley ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 2741273d9f13SBarry Smith ierr = MatSetType(*A,MATSEQDENSE);CHKERRQ(ierr); 2742273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(*A,data);CHKERRQ(ierr); 2743273d9f13SBarry Smith PetscFunctionReturn(0); 2744273d9f13SBarry Smith } 2745273d9f13SBarry Smith 2746273d9f13SBarry Smith /*@C 2747273d9f13SBarry Smith MatSeqDenseSetPreallocation - Sets the array used for storing the matrix elements 2748273d9f13SBarry Smith 2749d083f849SBarry Smith Collective 2750273d9f13SBarry Smith 2751273d9f13SBarry Smith Input Parameters: 27521c4f3114SJed Brown + B - the matrix 27530298fd71SBarry Smith - data - the array (or NULL) 2754273d9f13SBarry Smith 2755273d9f13SBarry Smith Notes: 2756273d9f13SBarry Smith The data input variable is intended primarily for Fortran programmers 2757273d9f13SBarry Smith who wish to allocate their own matrix memory space. Most users should 2758284134d9SBarry Smith need not call this routine. 2759273d9f13SBarry Smith 2760273d9f13SBarry Smith Level: intermediate 2761273d9f13SBarry Smith 2762*ad16ce7aSStefano Zampini .seealso: MatCreate(), MatCreateDense(), MatSetValues(), MatDenseSetLDA() 2763867c911aSBarry Smith 2764273d9f13SBarry Smith @*/ 27657087cfbeSBarry Smith PetscErrorCode MatSeqDenseSetPreallocation(Mat B,PetscScalar data[]) 2766273d9f13SBarry Smith { 27674ac538c5SBarry Smith PetscErrorCode ierr; 2768a23d5eceSKris Buschelman 2769a23d5eceSKris Buschelman PetscFunctionBegin; 2770d5ea218eSStefano Zampini PetscValidHeaderSpecific(B,MAT_CLASSID,1); 27714ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqDenseSetPreallocation_C",(Mat,PetscScalar[]),(B,data));CHKERRQ(ierr); 2772a23d5eceSKris Buschelman PetscFunctionReturn(0); 2773a23d5eceSKris Buschelman } 2774a23d5eceSKris Buschelman 27757087cfbeSBarry Smith PetscErrorCode MatSeqDenseSetPreallocation_SeqDense(Mat B,PetscScalar *data) 2776a23d5eceSKris Buschelman { 2777*ad16ce7aSStefano Zampini Mat_SeqDense *b = (Mat_SeqDense*)B->data; 2778dfbe8321SBarry Smith PetscErrorCode ierr; 2779273d9f13SBarry Smith 2780273d9f13SBarry Smith PetscFunctionBegin; 2781273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 2782a868139aSShri Abhyankar 278334ef9618SShri Abhyankar ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 278434ef9618SShri Abhyankar ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 278534ef9618SShri Abhyankar 2786*ad16ce7aSStefano Zampini if (b->lda <= 0) b->lda = B->rmap->n; 278786d161a7SShri Abhyankar 2788*ad16ce7aSStefano Zampini ierr = PetscIntMultError(b->lda,B->cmap->n,NULL);CHKERRQ(ierr); 27899e8f95c4SLisandro Dalcin if (!data) { /* petsc-allocated storage */ 27909e8f95c4SLisandro Dalcin if (!b->user_alloc) { ierr = PetscFree(b->v);CHKERRQ(ierr); } 2791*ad16ce7aSStefano Zampini ierr = PetscCalloc1((size_t)b->lda*B->cmap->n,&b->v);CHKERRQ(ierr); 2792*ad16ce7aSStefano Zampini ierr = PetscLogObjectMemory((PetscObject)B,b->lda*B->cmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 27932205254eSKarl Rupp 27949e8f95c4SLisandro Dalcin b->user_alloc = PETSC_FALSE; 2795273d9f13SBarry Smith } else { /* user-allocated storage */ 27969e8f95c4SLisandro Dalcin if (!b->user_alloc) { ierr = PetscFree(b->v);CHKERRQ(ierr); } 2797273d9f13SBarry Smith b->v = data; 2798273d9f13SBarry Smith b->user_alloc = PETSC_TRUE; 2799273d9f13SBarry Smith } 28000450473dSBarry Smith B->assembled = PETSC_TRUE; 2801273d9f13SBarry Smith PetscFunctionReturn(0); 2802273d9f13SBarry Smith } 2803273d9f13SBarry Smith 280465b80a83SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 2805cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqDense_Elemental(Mat A, MatType newtype,MatReuse reuse,Mat *newmat) 28068baccfbdSHong Zhang { 2807d77f618aSHong Zhang Mat mat_elemental; 2808d77f618aSHong Zhang PetscErrorCode ierr; 28091683a169SBarry Smith const PetscScalar *array; 28101683a169SBarry Smith PetscScalar *v_colwise; 2811d77f618aSHong Zhang PetscInt M=A->rmap->N,N=A->cmap->N,i,j,k,*rows,*cols; 2812d77f618aSHong Zhang 28138baccfbdSHong Zhang PetscFunctionBegin; 2814d77f618aSHong Zhang ierr = PetscMalloc3(M*N,&v_colwise,M,&rows,N,&cols);CHKERRQ(ierr); 28151683a169SBarry Smith ierr = MatDenseGetArrayRead(A,&array);CHKERRQ(ierr); 2816d77f618aSHong Zhang /* convert column-wise array into row-wise v_colwise, see MatSetValues_Elemental() */ 2817d77f618aSHong Zhang k = 0; 2818d77f618aSHong Zhang for (j=0; j<N; j++) { 2819d77f618aSHong Zhang cols[j] = j; 2820d77f618aSHong Zhang for (i=0; i<M; i++) { 2821d77f618aSHong Zhang v_colwise[j*M+i] = array[k++]; 2822d77f618aSHong Zhang } 2823d77f618aSHong Zhang } 2824d77f618aSHong Zhang for (i=0; i<M; i++) { 2825d77f618aSHong Zhang rows[i] = i; 2826d77f618aSHong Zhang } 28271683a169SBarry Smith ierr = MatDenseRestoreArrayRead(A,&array);CHKERRQ(ierr); 2828d77f618aSHong Zhang 2829d77f618aSHong Zhang ierr = MatCreate(PetscObjectComm((PetscObject)A), &mat_elemental);CHKERRQ(ierr); 2830d77f618aSHong Zhang ierr = MatSetSizes(mat_elemental,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 2831d77f618aSHong Zhang ierr = MatSetType(mat_elemental,MATELEMENTAL);CHKERRQ(ierr); 2832d77f618aSHong Zhang ierr = MatSetUp(mat_elemental);CHKERRQ(ierr); 2833d77f618aSHong Zhang 2834d77f618aSHong Zhang /* PETSc-Elemental interaface uses axpy for setting off-processor entries, only ADD_VALUES is allowed */ 2835d77f618aSHong Zhang ierr = MatSetValues(mat_elemental,M,rows,N,cols,v_colwise,ADD_VALUES);CHKERRQ(ierr); 2836d77f618aSHong Zhang ierr = MatAssemblyBegin(mat_elemental, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2837d77f618aSHong Zhang ierr = MatAssemblyEnd(mat_elemental, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2838d77f618aSHong Zhang ierr = PetscFree3(v_colwise,rows,cols);CHKERRQ(ierr); 2839d77f618aSHong Zhang 2840511c6705SHong Zhang if (reuse == MAT_INPLACE_MATRIX) { 284128be2f97SBarry Smith ierr = MatHeaderReplace(A,&mat_elemental);CHKERRQ(ierr); 2842d77f618aSHong Zhang } else { 2843d77f618aSHong Zhang *newmat = mat_elemental; 2844d77f618aSHong Zhang } 28458baccfbdSHong Zhang PetscFunctionReturn(0); 28468baccfbdSHong Zhang } 284765b80a83SHong Zhang #endif 28488baccfbdSHong Zhang 2849*ad16ce7aSStefano Zampini static PetscErrorCode MatDenseSetLDA_SeqDense(Mat B,PetscInt lda) 28501b807ce4Svictorle { 28511b807ce4Svictorle Mat_SeqDense *b = (Mat_SeqDense*)B->data; 285221a2c019SBarry Smith 28531b807ce4Svictorle PetscFunctionBegin; 2854e32f2f54SBarry Smith if (lda < B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"LDA %D must be at least matrix dimension %D",lda,B->rmap->n); 28551b807ce4Svictorle b->lda = lda; 28561b807ce4Svictorle PetscFunctionReturn(0); 28571b807ce4Svictorle } 28581b807ce4Svictorle 2859d528f656SJakub Kruzik PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqDense(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 2860d528f656SJakub Kruzik { 2861d528f656SJakub Kruzik PetscErrorCode ierr; 2862d528f656SJakub Kruzik PetscMPIInt size; 2863d528f656SJakub Kruzik 2864d528f656SJakub Kruzik PetscFunctionBegin; 2865d528f656SJakub Kruzik ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 2866d528f656SJakub Kruzik if (size == 1) { 2867d528f656SJakub Kruzik if (scall == MAT_INITIAL_MATRIX) { 2868d528f656SJakub Kruzik ierr = MatDuplicate(inmat,MAT_COPY_VALUES,outmat);CHKERRQ(ierr); 2869d528f656SJakub Kruzik } else { 2870d528f656SJakub Kruzik ierr = MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 2871d528f656SJakub Kruzik } 2872d528f656SJakub Kruzik } else { 2873d528f656SJakub Kruzik ierr = MatCreateMPIMatConcatenateSeqMat_MPIDense(comm,inmat,n,scall,outmat);CHKERRQ(ierr); 2874d528f656SJakub Kruzik } 2875d528f656SJakub Kruzik PetscFunctionReturn(0); 2876d528f656SJakub Kruzik } 2877d528f656SJakub Kruzik 28786947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVec_SeqDense(Mat A,PetscInt col,Vec *v) 28796947451fSStefano Zampini { 28806947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 28816947451fSStefano Zampini PetscErrorCode ierr; 28826947451fSStefano Zampini 28836947451fSStefano Zampini PetscFunctionBegin; 28846947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 28856947451fSStefano Zampini if (!a->cvec) { 28866947451fSStefano Zampini ierr = VecCreateSeqWithArray(PetscObjectComm((PetscObject)A),A->rmap->bs,A->rmap->n,NULL,&a->cvec);CHKERRQ(ierr); 28876947451fSStefano Zampini } 28886947451fSStefano Zampini a->vecinuse = col + 1; 28896947451fSStefano Zampini ierr = MatDenseGetArray(A,(PetscScalar**)&a->ptrinuse);CHKERRQ(ierr); 28906947451fSStefano Zampini ierr = VecPlaceArray(a->cvec,a->ptrinuse + (size_t)col * (size_t)a->lda);CHKERRQ(ierr); 28916947451fSStefano Zampini *v = a->cvec; 28926947451fSStefano Zampini PetscFunctionReturn(0); 28936947451fSStefano Zampini } 28946947451fSStefano Zampini 28956947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVec_SeqDense(Mat A,PetscInt col,Vec *v) 28966947451fSStefano Zampini { 28976947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 28986947451fSStefano Zampini PetscErrorCode ierr; 28996947451fSStefano Zampini 29006947451fSStefano Zampini PetscFunctionBegin; 29016947451fSStefano Zampini if (!a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseGetColumnVec first"); 29026947451fSStefano Zampini if (!a->cvec) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Missing internal column vector"); 29036947451fSStefano Zampini a->vecinuse = 0; 29046947451fSStefano Zampini ierr = MatDenseRestoreArray(A,(PetscScalar**)&a->ptrinuse);CHKERRQ(ierr); 29056947451fSStefano Zampini ierr = VecResetArray(a->cvec);CHKERRQ(ierr); 29066947451fSStefano Zampini *v = NULL; 29076947451fSStefano Zampini PetscFunctionReturn(0); 29086947451fSStefano Zampini } 29096947451fSStefano Zampini 29106947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVecRead_SeqDense(Mat A,PetscInt col,Vec *v) 29116947451fSStefano Zampini { 29126947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 29136947451fSStefano Zampini PetscErrorCode ierr; 29146947451fSStefano Zampini 29156947451fSStefano Zampini PetscFunctionBegin; 29166947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 29176947451fSStefano Zampini if (!a->cvec) { 29186947451fSStefano Zampini ierr = VecCreateSeqWithArray(PetscObjectComm((PetscObject)A),A->rmap->bs,A->rmap->n,NULL,&a->cvec);CHKERRQ(ierr); 29196947451fSStefano Zampini } 29206947451fSStefano Zampini a->vecinuse = col + 1; 29216947451fSStefano Zampini ierr = MatDenseGetArrayRead(A,&a->ptrinuse);CHKERRQ(ierr); 29226947451fSStefano Zampini ierr = VecPlaceArray(a->cvec,a->ptrinuse + (size_t)col * (size_t)a->lda);CHKERRQ(ierr); 29236947451fSStefano Zampini ierr = VecLockReadPush(a->cvec);CHKERRQ(ierr); 29246947451fSStefano Zampini *v = a->cvec; 29256947451fSStefano Zampini PetscFunctionReturn(0); 29266947451fSStefano Zampini } 29276947451fSStefano Zampini 29286947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVecRead_SeqDense(Mat A,PetscInt col,Vec *v) 29296947451fSStefano Zampini { 29306947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 29316947451fSStefano Zampini PetscErrorCode ierr; 29326947451fSStefano Zampini 29336947451fSStefano Zampini PetscFunctionBegin; 29346947451fSStefano Zampini if (!a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseGetColumnVec first"); 29356947451fSStefano Zampini if (!a->cvec) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Missing internal column vector"); 29366947451fSStefano Zampini a->vecinuse = 0; 29376947451fSStefano Zampini ierr = MatDenseRestoreArrayRead(A,&a->ptrinuse);CHKERRQ(ierr); 29386947451fSStefano Zampini ierr = VecLockReadPop(a->cvec);CHKERRQ(ierr); 29396947451fSStefano Zampini ierr = VecResetArray(a->cvec);CHKERRQ(ierr); 29406947451fSStefano Zampini *v = NULL; 29416947451fSStefano Zampini PetscFunctionReturn(0); 29426947451fSStefano Zampini } 29436947451fSStefano Zampini 29446947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVecWrite_SeqDense(Mat A,PetscInt col,Vec *v) 29456947451fSStefano Zampini { 29466947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 29476947451fSStefano Zampini PetscErrorCode ierr; 29486947451fSStefano Zampini 29496947451fSStefano Zampini PetscFunctionBegin; 29506947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 29516947451fSStefano Zampini if (!a->cvec) { 29526947451fSStefano Zampini ierr = VecCreateSeqWithArray(PetscObjectComm((PetscObject)A),A->rmap->bs,A->rmap->n,NULL,&a->cvec);CHKERRQ(ierr); 29536947451fSStefano Zampini } 29546947451fSStefano Zampini a->vecinuse = col + 1; 29556947451fSStefano Zampini ierr = MatDenseGetArrayWrite(A,(PetscScalar**)&a->ptrinuse);CHKERRQ(ierr); 29566947451fSStefano Zampini ierr = VecPlaceArray(a->cvec,a->ptrinuse + (size_t)col * (size_t)a->lda);CHKERRQ(ierr); 29576947451fSStefano Zampini *v = a->cvec; 29586947451fSStefano Zampini PetscFunctionReturn(0); 29596947451fSStefano Zampini } 29606947451fSStefano Zampini 29616947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVecWrite_SeqDense(Mat A,PetscInt col,Vec *v) 29626947451fSStefano Zampini { 29636947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 29646947451fSStefano Zampini PetscErrorCode ierr; 29656947451fSStefano Zampini 29666947451fSStefano Zampini PetscFunctionBegin; 29676947451fSStefano Zampini if (!a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseGetColumnVec first"); 29686947451fSStefano Zampini if (!a->cvec) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Missing internal column vector"); 29696947451fSStefano Zampini a->vecinuse = 0; 29706947451fSStefano Zampini ierr = MatDenseRestoreArrayWrite(A,(PetscScalar**)&a->ptrinuse);CHKERRQ(ierr); 29716947451fSStefano Zampini ierr = VecResetArray(a->cvec);CHKERRQ(ierr); 29726947451fSStefano Zampini *v = NULL; 29736947451fSStefano Zampini PetscFunctionReturn(0); 29746947451fSStefano Zampini } 29756947451fSStefano Zampini 29760bad9183SKris Buschelman /*MC 2977fafad747SKris Buschelman MATSEQDENSE - MATSEQDENSE = "seqdense" - A matrix type to be used for sequential dense matrices. 29780bad9183SKris Buschelman 29790bad9183SKris Buschelman Options Database Keys: 29800bad9183SKris Buschelman . -mat_type seqdense - sets the matrix type to "seqdense" during a call to MatSetFromOptions() 29810bad9183SKris Buschelman 29820bad9183SKris Buschelman Level: beginner 29830bad9183SKris Buschelman 298489665df3SBarry Smith .seealso: MatCreateSeqDense() 298589665df3SBarry Smith 29860bad9183SKris Buschelman M*/ 2987ca15aa20SStefano Zampini PetscErrorCode MatCreate_SeqDense(Mat B) 2988273d9f13SBarry Smith { 2989273d9f13SBarry Smith Mat_SeqDense *b; 2990dfbe8321SBarry Smith PetscErrorCode ierr; 29917c334f02SBarry Smith PetscMPIInt size; 2992273d9f13SBarry Smith 2993273d9f13SBarry Smith PetscFunctionBegin; 2994ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)B),&size);CHKERRQ(ierr); 2995e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Comm must be of size 1"); 299655659b69SBarry Smith 2997b00a9115SJed Brown ierr = PetscNewLog(B,&b);CHKERRQ(ierr); 2998549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 299944cd7ae7SLois Curfman McInnes B->data = (void*)b; 300018f449edSLois Curfman McInnes 3001273d9f13SBarry Smith b->roworiented = PETSC_TRUE; 30024e220ebcSLois Curfman McInnes 300349a6ff4bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetLDA_C",MatDenseGetLDA_SeqDense);CHKERRQ(ierr); 3004*ad16ce7aSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseSetLDA_C",MatDenseSetLDA_SeqDense);CHKERRQ(ierr); 3005bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetArray_C",MatDenseGetArray_SeqDense);CHKERRQ(ierr); 30068572280aSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreArray_C",MatDenseRestoreArray_SeqDense);CHKERRQ(ierr); 3007d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDensePlaceArray_C",MatDensePlaceArray_SeqDense);CHKERRQ(ierr); 3008d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseResetArray_C",MatDenseResetArray_SeqDense);CHKERRQ(ierr); 3009d5ea218eSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseReplaceArray_C",MatDenseReplaceArray_SeqDense);CHKERRQ(ierr); 30108572280aSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetArrayRead_C",MatDenseGetArray_SeqDense);CHKERRQ(ierr); 3011715b7558SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreArrayRead_C",MatDenseRestoreArray_SeqDense);CHKERRQ(ierr); 30126947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetArrayWrite_C",MatDenseGetArray_SeqDense);CHKERRQ(ierr); 30136947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreArrayWrite_C",MatDenseRestoreArray_SeqDense);CHKERRQ(ierr); 3014bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqdense_seqaij_C",MatConvert_SeqDense_SeqAIJ);CHKERRQ(ierr); 30158baccfbdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 30168baccfbdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqdense_elemental_C",MatConvert_SeqDense_Elemental);CHKERRQ(ierr); 30178baccfbdSHong Zhang #endif 30182bf066beSStefano Zampini #if defined(PETSC_HAVE_CUDA) 30192bf066beSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqdense_seqdensecuda_C",MatConvert_SeqDense_SeqDenseCUDA);CHKERRQ(ierr); 30204222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdensecuda_seqdensecuda_C",MatProductSetFromOptions_SeqDense);CHKERRQ(ierr); 30214222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdensecuda_seqdense_C",MatProductSetFromOptions_SeqDense);CHKERRQ(ierr); 3022637a0070SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqdensecuda_C",MatProductSetFromOptions_SeqDense);CHKERRQ(ierr); 30234222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaijcusparse_seqdense_C",MatProductSetFromOptions_SeqAIJ_SeqDense);CHKERRQ(ierr); 30242bf066beSStefano Zampini #endif 3025bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqDenseSetPreallocation_C",MatSeqDenseSetPreallocation_SeqDense);CHKERRQ(ierr); 30264222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqdense_C",MatProductSetFromOptions_SeqAIJ_SeqDense);CHKERRQ(ierr); 30274222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqdense_C",MatProductSetFromOptions_SeqDense);CHKERRQ(ierr); 3028bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqaij_seqdense_C",MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 3029bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqaij_seqdense_C",MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 30304222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqbaij_seqdense_C",MatProductSetFromOptions_SeqXBAIJ_SeqDense);CHKERRQ(ierr); 3031a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqbaij_seqdense_C",MatMatMultSymbolic_SeqBAIJ_SeqDense);CHKERRQ(ierr); 3032a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqbaij_seqdense_C",MatMatMultNumeric_SeqBAIJ_SeqDense);CHKERRQ(ierr); 30334222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqsbaij_seqdense_C",MatProductSetFromOptions_SeqXBAIJ_SeqDense);CHKERRQ(ierr); 3034c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqsbaij_seqdense_C",MatMatMultSymbolic_SeqSBAIJ_SeqDense);CHKERRQ(ierr); 3035c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqsbaij_seqdense_C",MatMatMultNumeric_SeqSBAIJ_SeqDense);CHKERRQ(ierr); 30364099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqaijperm_seqdense_C",MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 30374099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqaijperm_seqdense_C",MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 3038e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqaijsell_seqdense_C",MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 3039e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqaijsell_seqdense_C",MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 304096e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqaijmkl_seqdense_C",MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 304196e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqaijmkl_seqdense_C",MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 304252c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_nest_seqdense_C",MatMatMultSymbolic_Nest_Dense);CHKERRQ(ierr); 304352c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_nest_seqdense_C",MatMatMultNumeric_Nest_Dense);CHKERRQ(ierr); 304496e6d5c4SRichard Tran Mills 30453bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultSymbolic_seqaij_seqdense_C",MatTransposeMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 30463bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultNumeric_seqaij_seqdense_C",MatTransposeMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 30474099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultSymbolic_seqaijperm_seqdense_C",MatTransposeMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 30484099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultNumeric_seqaijperm_seqdense_C",MatTransposeMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 3049e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultSymbolic_seqaijsell_seqdense_C",MatTransposeMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 3050e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultNumeric_seqaijsell_seqdense_C",MatTransposeMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 305196e6d5c4SRichard Tran Mills 305296e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultSymbolic_seqaijmkl_seqdense_C",MatTransposeMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 305396e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultNumeric_seqaijmkl_seqdense_C",MatTransposeMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 3054af53bab2SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumn_C",MatDenseGetColumn_SeqDense);CHKERRQ(ierr); 3055af53bab2SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumn_C",MatDenseRestoreColumn_SeqDense);CHKERRQ(ierr); 30566947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumnVec_C",MatDenseGetColumnVec_SeqDense);CHKERRQ(ierr); 30576947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumnVec_C",MatDenseRestoreColumnVec_SeqDense);CHKERRQ(ierr); 30586947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumnVecRead_C",MatDenseGetColumnVecRead_SeqDense);CHKERRQ(ierr); 30596947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumnVecRead_C",MatDenseRestoreColumnVecRead_SeqDense);CHKERRQ(ierr); 30606947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumnVecWrite_C",MatDenseGetColumnVecWrite_SeqDense);CHKERRQ(ierr); 30616947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumnVecWrite_C",MatDenseRestoreColumnVecWrite_SeqDense);CHKERRQ(ierr); 306217667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQDENSE);CHKERRQ(ierr); 30633a40ed3dSBarry Smith PetscFunctionReturn(0); 3064289bc588SBarry Smith } 306586aefd0dSHong Zhang 306686aefd0dSHong Zhang /*@C 3067af53bab2SHong Zhang MatDenseGetColumn - gives access to a column of a dense matrix. This is only the local part of the column. You MUST call MatDenseRestoreColumn() to avoid memory bleeding. 306886aefd0dSHong Zhang 306986aefd0dSHong Zhang Not Collective 307086aefd0dSHong Zhang 307186aefd0dSHong Zhang Input Parameter: 307286aefd0dSHong Zhang + mat - a MATSEQDENSE or MATMPIDENSE matrix 307386aefd0dSHong Zhang - col - column index 307486aefd0dSHong Zhang 307586aefd0dSHong Zhang Output Parameter: 307686aefd0dSHong Zhang . vals - pointer to the data 307786aefd0dSHong Zhang 307886aefd0dSHong Zhang Level: intermediate 307986aefd0dSHong Zhang 308086aefd0dSHong Zhang .seealso: MatDenseRestoreColumn() 308186aefd0dSHong Zhang @*/ 308286aefd0dSHong Zhang PetscErrorCode MatDenseGetColumn(Mat A,PetscInt col,PetscScalar **vals) 308386aefd0dSHong Zhang { 308486aefd0dSHong Zhang PetscErrorCode ierr; 308586aefd0dSHong Zhang 308686aefd0dSHong Zhang PetscFunctionBegin; 3087d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 3088d5ea218eSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 3089d5ea218eSStefano Zampini PetscValidPointer(vals,3); 309086aefd0dSHong Zhang ierr = PetscUseMethod(A,"MatDenseGetColumn_C",(Mat,PetscInt,PetscScalar**),(A,col,vals));CHKERRQ(ierr); 309186aefd0dSHong Zhang PetscFunctionReturn(0); 309286aefd0dSHong Zhang } 309386aefd0dSHong Zhang 309486aefd0dSHong Zhang /*@C 309586aefd0dSHong Zhang MatDenseRestoreColumn - returns access to a column of a dense matrix which is returned by MatDenseGetColumn(). 309686aefd0dSHong Zhang 309786aefd0dSHong Zhang Not Collective 309886aefd0dSHong Zhang 309986aefd0dSHong Zhang Input Parameter: 310086aefd0dSHong Zhang . mat - a MATSEQDENSE or MATMPIDENSE matrix 310186aefd0dSHong Zhang 310286aefd0dSHong Zhang Output Parameter: 310386aefd0dSHong Zhang . vals - pointer to the data 310486aefd0dSHong Zhang 310586aefd0dSHong Zhang Level: intermediate 310686aefd0dSHong Zhang 310786aefd0dSHong Zhang .seealso: MatDenseGetColumn() 310886aefd0dSHong Zhang @*/ 310986aefd0dSHong Zhang PetscErrorCode MatDenseRestoreColumn(Mat A,PetscScalar **vals) 311086aefd0dSHong Zhang { 311186aefd0dSHong Zhang PetscErrorCode ierr; 311286aefd0dSHong Zhang 311386aefd0dSHong Zhang PetscFunctionBegin; 3114d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 3115d5ea218eSStefano Zampini PetscValidPointer(vals,2); 311686aefd0dSHong Zhang ierr = PetscUseMethod(A,"MatDenseRestoreColumn_C",(Mat,PetscScalar**),(A,vals));CHKERRQ(ierr); 311786aefd0dSHong Zhang PetscFunctionReturn(0); 311886aefd0dSHong Zhang } 31196947451fSStefano Zampini 31206947451fSStefano Zampini /*@C 31216947451fSStefano Zampini MatDenseGetColumnVec - Gives read-write access to a column of a dense matrix, represented as a Vec. 31226947451fSStefano Zampini 31236947451fSStefano Zampini Collective 31246947451fSStefano Zampini 31256947451fSStefano Zampini Input Parameter: 31266947451fSStefano Zampini + mat - the Mat object 31276947451fSStefano Zampini - col - the column index 31286947451fSStefano Zampini 31296947451fSStefano Zampini Output Parameter: 31306947451fSStefano Zampini . v - the vector 31316947451fSStefano Zampini 31326947451fSStefano Zampini Notes: 31336947451fSStefano Zampini The vector is owned by PETSc. Users need to call MatDenseRestoreColumnVec() when the vector is no longer needed. 31346947451fSStefano Zampini Use MatDenseGetColumnVecRead() to obtain read-only access or MatDenseGetColumnVecWrite() for write-only access. 31356947451fSStefano Zampini 31366947451fSStefano Zampini Level: intermediate 31376947451fSStefano Zampini 31386947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVecRead(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecRead(), MatDenseRestoreColumnVecWrite() 31396947451fSStefano Zampini @*/ 31406947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVec(Mat A,PetscInt col,Vec *v) 31416947451fSStefano Zampini { 31426947451fSStefano Zampini PetscErrorCode ierr; 31436947451fSStefano Zampini 31446947451fSStefano Zampini PetscFunctionBegin; 31456947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 31466947451fSStefano Zampini PetscValidType(A,1); 31476947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 31486947451fSStefano Zampini PetscValidPointer(v,3); 31496947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 31506947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 31516947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseGetColumnVec_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 31526947451fSStefano Zampini PetscFunctionReturn(0); 31536947451fSStefano Zampini } 31546947451fSStefano Zampini 31556947451fSStefano Zampini /*@C 31566947451fSStefano Zampini MatDenseRestoreColumnVec - Returns access to a column of a dense matrix obtained from MatDenseGetColumnVec(). 31576947451fSStefano Zampini 31586947451fSStefano Zampini Collective 31596947451fSStefano Zampini 31606947451fSStefano Zampini Input Parameter: 31616947451fSStefano Zampini + mat - the Mat object 31626947451fSStefano Zampini . col - the column index 31636947451fSStefano Zampini - v - the Vec object 31646947451fSStefano Zampini 31656947451fSStefano Zampini Level: intermediate 31666947451fSStefano Zampini 31676947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecRead(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVecRead(), MatDenseRestoreColumnVecWrite() 31686947451fSStefano Zampini @*/ 31696947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVec(Mat A,PetscInt col,Vec *v) 31706947451fSStefano Zampini { 31716947451fSStefano Zampini PetscErrorCode ierr; 31726947451fSStefano Zampini 31736947451fSStefano Zampini PetscFunctionBegin; 31746947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 31756947451fSStefano Zampini PetscValidType(A,1); 31766947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 31776947451fSStefano Zampini PetscValidPointer(v,3); 31786947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 31796947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 31806947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseRestoreColumnVec_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 31816947451fSStefano Zampini PetscFunctionReturn(0); 31826947451fSStefano Zampini } 31836947451fSStefano Zampini 31846947451fSStefano Zampini /*@C 31856947451fSStefano Zampini MatDenseGetColumnVecRead - Gives read-only access to a column of a dense matrix, represented as a Vec. 31866947451fSStefano Zampini 31876947451fSStefano Zampini Collective 31886947451fSStefano Zampini 31896947451fSStefano Zampini Input Parameter: 31906947451fSStefano Zampini + mat - the Mat object 31916947451fSStefano Zampini - col - the column index 31926947451fSStefano Zampini 31936947451fSStefano Zampini Output Parameter: 31946947451fSStefano Zampini . v - the vector 31956947451fSStefano Zampini 31966947451fSStefano Zampini Notes: 31976947451fSStefano Zampini The vector is owned by PETSc and users cannot modify it. 31986947451fSStefano Zampini Users need to call MatDenseRestoreColumnVecRead() when the vector is no longer needed. 31996947451fSStefano Zampini Use MatDenseGetColumnVec() to obtain read-write access or MatDenseGetColumnVecWrite() for write-only access. 32006947451fSStefano Zampini 32016947451fSStefano Zampini Level: intermediate 32026947451fSStefano Zampini 32036947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecRead(), MatDenseRestoreColumnVecWrite() 32046947451fSStefano Zampini @*/ 32056947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVecRead(Mat A,PetscInt col,Vec *v) 32066947451fSStefano Zampini { 32076947451fSStefano Zampini PetscErrorCode ierr; 32086947451fSStefano Zampini 32096947451fSStefano Zampini PetscFunctionBegin; 32106947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 32116947451fSStefano Zampini PetscValidType(A,1); 32126947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 32136947451fSStefano Zampini PetscValidPointer(v,3); 32146947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 32156947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 32166947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseGetColumnVecRead_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 32176947451fSStefano Zampini PetscFunctionReturn(0); 32186947451fSStefano Zampini } 32196947451fSStefano Zampini 32206947451fSStefano Zampini /*@C 32216947451fSStefano Zampini MatDenseRestoreColumnVecRead - Returns access to a column of a dense matrix obtained from MatDenseGetColumnVecRead(). 32226947451fSStefano Zampini 32236947451fSStefano Zampini Collective 32246947451fSStefano Zampini 32256947451fSStefano Zampini Input Parameter: 32266947451fSStefano Zampini + mat - the Mat object 32276947451fSStefano Zampini . col - the column index 32286947451fSStefano Zampini - v - the Vec object 32296947451fSStefano Zampini 32306947451fSStefano Zampini Level: intermediate 32316947451fSStefano Zampini 32326947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecRead(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecWrite() 32336947451fSStefano Zampini @*/ 32346947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVecRead(Mat A,PetscInt col,Vec *v) 32356947451fSStefano Zampini { 32366947451fSStefano Zampini PetscErrorCode ierr; 32376947451fSStefano Zampini 32386947451fSStefano Zampini PetscFunctionBegin; 32396947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 32406947451fSStefano Zampini PetscValidType(A,1); 32416947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 32426947451fSStefano Zampini PetscValidPointer(v,3); 32436947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 32446947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 32456947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseRestoreColumnVecRead_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 32466947451fSStefano Zampini PetscFunctionReturn(0); 32476947451fSStefano Zampini } 32486947451fSStefano Zampini 32496947451fSStefano Zampini /*@C 32506947451fSStefano Zampini MatDenseGetColumnVecWrite - Gives write-only access to a column of a dense matrix, represented as a Vec. 32516947451fSStefano Zampini 32526947451fSStefano Zampini Collective 32536947451fSStefano Zampini 32546947451fSStefano Zampini Input Parameter: 32556947451fSStefano Zampini + mat - the Mat object 32566947451fSStefano Zampini - col - the column index 32576947451fSStefano Zampini 32586947451fSStefano Zampini Output Parameter: 32596947451fSStefano Zampini . v - the vector 32606947451fSStefano Zampini 32616947451fSStefano Zampini Notes: 32626947451fSStefano Zampini The vector is owned by PETSc. Users need to call MatDenseRestoreColumnVecWrite() when the vector is no longer needed. 32636947451fSStefano Zampini Use MatDenseGetColumnVec() to obtain read-write access or MatDenseGetColumnVecRead() for read-only access. 32646947451fSStefano Zampini 32656947451fSStefano Zampini Level: intermediate 32666947451fSStefano Zampini 32676947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecRead(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecRead(), MatDenseRestoreColumnVecWrite() 32686947451fSStefano Zampini @*/ 32696947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVecWrite(Mat A,PetscInt col,Vec *v) 32706947451fSStefano Zampini { 32716947451fSStefano Zampini PetscErrorCode ierr; 32726947451fSStefano Zampini 32736947451fSStefano Zampini PetscFunctionBegin; 32746947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 32756947451fSStefano Zampini PetscValidType(A,1); 32766947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 32776947451fSStefano Zampini PetscValidPointer(v,3); 32786947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 32796947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 32806947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseGetColumnVecWrite_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 32816947451fSStefano Zampini PetscFunctionReturn(0); 32826947451fSStefano Zampini } 32836947451fSStefano Zampini 32846947451fSStefano Zampini /*@C 32856947451fSStefano Zampini MatDenseRestoreColumnVecWrite - Returns access to a column of a dense matrix obtained from MatDenseGetColumnVecWrite(). 32866947451fSStefano Zampini 32876947451fSStefano Zampini Collective 32886947451fSStefano Zampini 32896947451fSStefano Zampini Input Parameter: 32906947451fSStefano Zampini + mat - the Mat object 32916947451fSStefano Zampini . col - the column index 32926947451fSStefano Zampini - v - the Vec object 32936947451fSStefano Zampini 32946947451fSStefano Zampini Level: intermediate 32956947451fSStefano Zampini 32966947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecRead(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecRead() 32976947451fSStefano Zampini @*/ 32986947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVecWrite(Mat A,PetscInt col,Vec *v) 32996947451fSStefano Zampini { 33006947451fSStefano Zampini PetscErrorCode ierr; 33016947451fSStefano Zampini 33026947451fSStefano Zampini PetscFunctionBegin; 33036947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 33046947451fSStefano Zampini PetscValidType(A,1); 33056947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 33066947451fSStefano Zampini PetscValidPointer(v,3); 33076947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 33086947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 33096947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseRestoreColumnVecWrite_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 33106947451fSStefano Zampini PetscFunctionReturn(0); 33116947451fSStefano Zampini } 3312