1be1d678aSKris Buschelman 267e560aaSBarry Smith /* 367e560aaSBarry Smith Defines the basic matrix operations for sequential dense. 467e560aaSBarry Smith */ 5289bc588SBarry Smith 6dec5eb66SMatthew G Knepley #include <../src/mat/impls/dense/seq/dense.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8289bc588SBarry Smith 96a63e612SBarry Smith #include <../src/mat/impls/aij/seq/aij.h> 10b2573a8aSBarry Smith 11ca15aa20SStefano Zampini PetscErrorCode MatSeqDenseSymmetrize_Private(Mat A, PetscBool hermitian) 128c178816SStefano Zampini { 138c178816SStefano Zampini Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 148c178816SStefano Zampini PetscInt j, k, n = A->rmap->n; 15ca15aa20SStefano Zampini PetscScalar *v; 16ca15aa20SStefano Zampini PetscErrorCode ierr; 178c178816SStefano Zampini 188c178816SStefano Zampini PetscFunctionBegin; 198c178816SStefano Zampini if (A->rmap->n != A->cmap->n) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot symmetrize a rectangular matrix"); 20ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 218c178816SStefano Zampini if (!hermitian) { 228c178816SStefano Zampini for (k=0;k<n;k++) { 238c178816SStefano Zampini for (j=k;j<n;j++) { 24ca15aa20SStefano Zampini v[j*mat->lda + k] = v[k*mat->lda + j]; 258c178816SStefano Zampini } 268c178816SStefano Zampini } 278c178816SStefano Zampini } else { 288c178816SStefano Zampini for (k=0;k<n;k++) { 298c178816SStefano Zampini for (j=k;j<n;j++) { 30ca15aa20SStefano Zampini v[j*mat->lda + k] = PetscConj(v[k*mat->lda + j]); 318c178816SStefano Zampini } 328c178816SStefano Zampini } 338c178816SStefano Zampini } 34ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 358c178816SStefano Zampini PetscFunctionReturn(0); 368c178816SStefano Zampini } 378c178816SStefano Zampini 3805709791SSatish Balay PETSC_EXTERN PetscErrorCode MatSeqDenseInvertFactors_Private(Mat A) 398c178816SStefano Zampini { 408c178816SStefano Zampini Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 418c178816SStefano Zampini PetscErrorCode ierr; 428c178816SStefano Zampini PetscBLASInt info,n; 438c178816SStefano Zampini 448c178816SStefano Zampini PetscFunctionBegin; 458c178816SStefano Zampini if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 468c178816SStefano Zampini ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 478c178816SStefano Zampini if (A->factortype == MAT_FACTOR_LU) { 488c178816SStefano Zampini if (!mat->pivots) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Pivots not present"); 498c178816SStefano Zampini if (!mat->fwork) { 508c178816SStefano Zampini mat->lfwork = n; 518c178816SStefano Zampini ierr = PetscMalloc1(mat->lfwork,&mat->fwork);CHKERRQ(ierr); 528c178816SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,mat->lfwork*sizeof(PetscBLASInt));CHKERRQ(ierr); 538c178816SStefano Zampini } 5400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 558c178816SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&mat->lfwork,&info)); 5600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 57ca15aa20SStefano Zampini ierr = PetscLogFlops((1.0*A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 588c178816SStefano Zampini } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 598c178816SStefano Zampini if (A->spd) { 6000121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 618c178816SStefano Zampini PetscStackCallBLAS("LAPACKpotri",LAPACKpotri_("L",&n,mat->v,&mat->lda,&info)); 6200121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 638c178816SStefano Zampini ierr = MatSeqDenseSymmetrize_Private(A,PETSC_TRUE);CHKERRQ(ierr); 648c178816SStefano Zampini #if defined(PETSC_USE_COMPLEX) 658c178816SStefano Zampini } else if (A->hermitian) { 668c178816SStefano Zampini if (!mat->pivots) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Pivots not present"); 678c178816SStefano Zampini if (!mat->fwork) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Fwork not present"); 6800121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 698c178816SStefano Zampini PetscStackCallBLAS("LAPACKhetri",LAPACKhetri_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&info)); 7000121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 718c178816SStefano Zampini ierr = MatSeqDenseSymmetrize_Private(A,PETSC_TRUE);CHKERRQ(ierr); 728c178816SStefano Zampini #endif 738c178816SStefano Zampini } else { /* symmetric case */ 748c178816SStefano Zampini if (!mat->pivots) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Pivots not present"); 758c178816SStefano Zampini if (!mat->fwork) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Fwork not present"); 7600121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 778c178816SStefano Zampini PetscStackCallBLAS("LAPACKsytri",LAPACKsytri_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&info)); 7800121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 798c178816SStefano Zampini ierr = MatSeqDenseSymmetrize_Private(A,PETSC_FALSE);CHKERRQ(ierr); 808c178816SStefano Zampini } 818c178816SStefano Zampini if (info) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_CH_ZRPVT,"Bad Inversion: zero pivot in row %D",(PetscInt)info-1); 82ca15aa20SStefano Zampini ierr = PetscLogFlops((1.0*A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 838c178816SStefano Zampini } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 848c178816SStefano Zampini 858c178816SStefano Zampini A->ops->solve = NULL; 868c178816SStefano Zampini A->ops->matsolve = NULL; 878c178816SStefano Zampini A->ops->solvetranspose = NULL; 888c178816SStefano Zampini A->ops->matsolvetranspose = NULL; 898c178816SStefano Zampini A->ops->solveadd = NULL; 908c178816SStefano Zampini A->ops->solvetransposeadd = NULL; 918c178816SStefano Zampini A->factortype = MAT_FACTOR_NONE; 928c178816SStefano Zampini ierr = PetscFree(A->solvertype);CHKERRQ(ierr); 938c178816SStefano Zampini PetscFunctionReturn(0); 948c178816SStefano Zampini } 958c178816SStefano Zampini 963f49a652SStefano Zampini PetscErrorCode MatZeroRowsColumns_SeqDense(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 973f49a652SStefano Zampini { 983f49a652SStefano Zampini PetscErrorCode ierr; 993f49a652SStefano Zampini Mat_SeqDense *l = (Mat_SeqDense*)A->data; 1003f49a652SStefano Zampini PetscInt m = l->lda, n = A->cmap->n,r = A->rmap->n, i,j; 101ca15aa20SStefano Zampini PetscScalar *slot,*bb,*v; 1023f49a652SStefano Zampini const PetscScalar *xx; 1033f49a652SStefano Zampini 1043f49a652SStefano Zampini PetscFunctionBegin; 10576bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 1063f49a652SStefano Zampini for (i=0; i<N; i++) { 1073f49a652SStefano Zampini if (rows[i] < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row requested to be zeroed"); 1083f49a652SStefano Zampini if (rows[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested to be zeroed greater than or equal number of rows %D",rows[i],A->rmap->n); 1093f49a652SStefano Zampini if (rows[i] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Col %D requested to be zeroed greater than or equal number of cols %D",rows[i],A->cmap->n); 1103f49a652SStefano Zampini } 11176bd3646SJed Brown } 112ca15aa20SStefano Zampini if (!N) PetscFunctionReturn(0); 1133f49a652SStefano Zampini 1143f49a652SStefano Zampini /* fix right hand side if needed */ 1153f49a652SStefano Zampini if (x && b) { 1166c4d906cSStefano Zampini Vec xt; 1176c4d906cSStefano Zampini 1186c4d906cSStefano Zampini if (A->rmap->n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only coded for square matrices"); 1196c4d906cSStefano Zampini ierr = VecDuplicate(x,&xt);CHKERRQ(ierr); 1206c4d906cSStefano Zampini ierr = VecCopy(x,xt);CHKERRQ(ierr); 1216c4d906cSStefano Zampini ierr = VecScale(xt,-1.0);CHKERRQ(ierr); 1226c4d906cSStefano Zampini ierr = MatMultAdd(A,xt,b,b);CHKERRQ(ierr); 1236c4d906cSStefano Zampini ierr = VecDestroy(&xt);CHKERRQ(ierr); 1243f49a652SStefano Zampini ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 1253f49a652SStefano Zampini ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 1263f49a652SStefano Zampini for (i=0; i<N; i++) bb[rows[i]] = diag*xx[rows[i]]; 1273f49a652SStefano Zampini ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 1283f49a652SStefano Zampini ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 1293f49a652SStefano Zampini } 1303f49a652SStefano Zampini 131ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 1323f49a652SStefano Zampini for (i=0; i<N; i++) { 133ca15aa20SStefano Zampini slot = v + rows[i]*m; 134580bdb30SBarry Smith ierr = PetscArrayzero(slot,r);CHKERRQ(ierr); 1353f49a652SStefano Zampini } 1363f49a652SStefano Zampini for (i=0; i<N; i++) { 137ca15aa20SStefano Zampini slot = v + rows[i]; 1383f49a652SStefano Zampini for (j=0; j<n; j++) { *slot = 0.0; slot += m;} 1393f49a652SStefano Zampini } 1403f49a652SStefano Zampini if (diag != 0.0) { 1413f49a652SStefano Zampini if (A->rmap->n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only coded for square matrices"); 1423f49a652SStefano Zampini for (i=0; i<N; i++) { 143ca15aa20SStefano Zampini slot = v + (m+1)*rows[i]; 1443f49a652SStefano Zampini *slot = diag; 1453f49a652SStefano Zampini } 1463f49a652SStefano Zampini } 147ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 1483f49a652SStefano Zampini PetscFunctionReturn(0); 1493f49a652SStefano Zampini } 1503f49a652SStefano Zampini 151abc3b08eSStefano Zampini PetscErrorCode MatPtAPNumeric_SeqDense_SeqDense(Mat A,Mat P,Mat C) 152abc3b08eSStefano Zampini { 153abc3b08eSStefano Zampini Mat_SeqDense *c = (Mat_SeqDense*)(C->data); 154abc3b08eSStefano Zampini PetscErrorCode ierr; 155abc3b08eSStefano Zampini 156abc3b08eSStefano Zampini PetscFunctionBegin; 157ca15aa20SStefano Zampini if (c->ptapwork) { 158ca15aa20SStefano Zampini ierr = (*C->ops->matmultnumeric)(A,P,c->ptapwork);CHKERRQ(ierr); 159ca15aa20SStefano Zampini ierr = (*C->ops->transposematmultnumeric)(P,c->ptapwork,C);CHKERRQ(ierr); 1604222ddf1SHong Zhang } else SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_SUP,"Must call MatPtAPSymbolic_SeqDense_SeqDense() first"); 161abc3b08eSStefano Zampini PetscFunctionReturn(0); 162abc3b08eSStefano Zampini } 163abc3b08eSStefano Zampini 1644222ddf1SHong Zhang PetscErrorCode MatPtAPSymbolic_SeqDense_SeqDense(Mat A,Mat P,PetscReal fill,Mat C) 165abc3b08eSStefano Zampini { 166abc3b08eSStefano Zampini Mat_SeqDense *c; 1677a3c3d58SStefano Zampini PetscBool cisdense; 168abc3b08eSStefano Zampini PetscErrorCode ierr; 169abc3b08eSStefano Zampini 170abc3b08eSStefano Zampini PetscFunctionBegin; 1714222ddf1SHong Zhang ierr = MatSetSizes(C,P->cmap->n,P->cmap->n,P->cmap->N,P->cmap->N);CHKERRQ(ierr); 1727a3c3d58SStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 1737a3c3d58SStefano Zampini if (!cisdense) { 1747a3c3d58SStefano Zampini PetscBool flg; 1757a3c3d58SStefano Zampini 1767a3c3d58SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)P,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 1774222ddf1SHong Zhang ierr = MatSetType(C,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 1787a3c3d58SStefano Zampini } 1797a3c3d58SStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 1804222ddf1SHong Zhang c = (Mat_SeqDense*)C->data; 181ca15aa20SStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)A),&c->ptapwork);CHKERRQ(ierr); 182ca15aa20SStefano Zampini ierr = MatSetSizes(c->ptapwork,A->rmap->n,P->cmap->n,A->rmap->N,P->cmap->N);CHKERRQ(ierr); 1837a3c3d58SStefano Zampini ierr = MatSetType(c->ptapwork,((PetscObject)C)->type_name);CHKERRQ(ierr); 1847a3c3d58SStefano Zampini ierr = MatSetUp(c->ptapwork);CHKERRQ(ierr); 185abc3b08eSStefano Zampini PetscFunctionReturn(0); 186abc3b08eSStefano Zampini } 187abc3b08eSStefano Zampini 188cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqDense(Mat A,MatType newtype,MatReuse reuse,Mat *newmat) 189b49cda9fSStefano Zampini { 190a13144ffSStefano Zampini Mat B = NULL; 191b49cda9fSStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 192b49cda9fSStefano Zampini Mat_SeqDense *b; 193b49cda9fSStefano Zampini PetscErrorCode ierr; 194b49cda9fSStefano Zampini PetscInt *ai=a->i,*aj=a->j,m=A->rmap->N,n=A->cmap->N,i; 195b49cda9fSStefano Zampini MatScalar *av=a->a; 196a13144ffSStefano Zampini PetscBool isseqdense; 197b49cda9fSStefano Zampini 198b49cda9fSStefano Zampini PetscFunctionBegin; 199a13144ffSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 200a13144ffSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)*newmat,MATSEQDENSE,&isseqdense);CHKERRQ(ierr); 201a32993e3SJed Brown if (!isseqdense) SETERRQ1(PetscObjectComm((PetscObject)*newmat),PETSC_ERR_USER,"Cannot reuse matrix of type %s",((PetscObject)(*newmat))->type_name); 202a13144ffSStefano Zampini } 203a13144ffSStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 204b49cda9fSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 205b49cda9fSStefano Zampini ierr = MatSetSizes(B,m,n,m,n);CHKERRQ(ierr); 206b49cda9fSStefano Zampini ierr = MatSetType(B,MATSEQDENSE);CHKERRQ(ierr); 207b49cda9fSStefano Zampini ierr = MatSeqDenseSetPreallocation(B,NULL);CHKERRQ(ierr); 208b49cda9fSStefano Zampini b = (Mat_SeqDense*)(B->data); 209a13144ffSStefano Zampini } else { 210a13144ffSStefano Zampini b = (Mat_SeqDense*)((*newmat)->data); 211580bdb30SBarry Smith ierr = PetscArrayzero(b->v,m*n);CHKERRQ(ierr); 212a13144ffSStefano Zampini } 213b49cda9fSStefano Zampini for (i=0; i<m; i++) { 214b49cda9fSStefano Zampini PetscInt j; 215b49cda9fSStefano Zampini for (j=0;j<ai[1]-ai[0];j++) { 216b49cda9fSStefano Zampini b->v[*aj*m+i] = *av; 217b49cda9fSStefano Zampini aj++; 218b49cda9fSStefano Zampini av++; 219b49cda9fSStefano Zampini } 220b49cda9fSStefano Zampini ai++; 221b49cda9fSStefano Zampini } 222b49cda9fSStefano Zampini 223511c6705SHong Zhang if (reuse == MAT_INPLACE_MATRIX) { 224a13144ffSStefano Zampini ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 225a13144ffSStefano Zampini ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 22628be2f97SBarry Smith ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr); 227b49cda9fSStefano Zampini } else { 228a13144ffSStefano Zampini if (B) *newmat = B; 229a13144ffSStefano Zampini ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 230a13144ffSStefano Zampini ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 231b49cda9fSStefano Zampini } 232b49cda9fSStefano Zampini PetscFunctionReturn(0); 233b49cda9fSStefano Zampini } 234b49cda9fSStefano Zampini 235cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqDense_SeqAIJ(Mat A, MatType newtype,MatReuse reuse,Mat *newmat) 2366a63e612SBarry Smith { 2376a63e612SBarry Smith Mat B; 2386a63e612SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2396a63e612SBarry Smith PetscErrorCode ierr; 2409399e1b8SMatthew G. Knepley PetscInt i, j; 2419399e1b8SMatthew G. Knepley PetscInt *rows, *nnz; 2429399e1b8SMatthew G. Knepley MatScalar *aa = a->v, *vals; 2436a63e612SBarry Smith 2446a63e612SBarry Smith PetscFunctionBegin; 245ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 2466a63e612SBarry Smith ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 2476a63e612SBarry Smith ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 2489399e1b8SMatthew G. Knepley ierr = PetscCalloc3(A->rmap->n,&rows,A->rmap->n,&nnz,A->rmap->n,&vals);CHKERRQ(ierr); 2499399e1b8SMatthew G. Knepley for (j=0; j<A->cmap->n; j++) { 2509399e1b8SMatthew G. Knepley for (i=0; i<A->rmap->n; i++) if (aa[i] != 0.0 || i == j) ++nnz[i]; 2516a63e612SBarry Smith aa += a->lda; 2526a63e612SBarry Smith } 2539399e1b8SMatthew G. Knepley ierr = MatSeqAIJSetPreallocation(B,PETSC_DETERMINE,nnz);CHKERRQ(ierr); 2549399e1b8SMatthew G. Knepley aa = a->v; 2559399e1b8SMatthew G. Knepley for (j=0; j<A->cmap->n; j++) { 2569399e1b8SMatthew G. Knepley PetscInt numRows = 0; 2579399e1b8SMatthew G. Knepley for (i=0; i<A->rmap->n; i++) if (aa[i] != 0.0 || i == j) {rows[numRows] = i; vals[numRows++] = aa[i];} 2589399e1b8SMatthew G. Knepley ierr = MatSetValues(B,numRows,rows,1,&j,vals,INSERT_VALUES);CHKERRQ(ierr); 2599399e1b8SMatthew G. Knepley aa += a->lda; 2609399e1b8SMatthew G. Knepley } 2619399e1b8SMatthew G. Knepley ierr = PetscFree3(rows,nnz,vals);CHKERRQ(ierr); 2626a63e612SBarry Smith ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2636a63e612SBarry Smith ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2646a63e612SBarry Smith 265511c6705SHong Zhang if (reuse == MAT_INPLACE_MATRIX) { 26628be2f97SBarry Smith ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr); 2676a63e612SBarry Smith } else { 2686a63e612SBarry Smith *newmat = B; 2696a63e612SBarry Smith } 2706a63e612SBarry Smith PetscFunctionReturn(0); 2716a63e612SBarry Smith } 2726a63e612SBarry Smith 273ca15aa20SStefano Zampini PetscErrorCode MatAXPY_SeqDense(Mat Y,PetscScalar alpha,Mat X,MatStructure str) 2741987afe7SBarry Smith { 2751987afe7SBarry Smith Mat_SeqDense *x = (Mat_SeqDense*)X->data,*y = (Mat_SeqDense*)Y->data; 276ca15aa20SStefano Zampini const PetscScalar *xv; 277ca15aa20SStefano Zampini PetscScalar *yv; 2780805154bSBarry Smith PetscBLASInt N,m,ldax,lday,one = 1; 279efee365bSSatish Balay PetscErrorCode ierr; 2803a40ed3dSBarry Smith 2813a40ed3dSBarry Smith PetscFunctionBegin; 282ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(X,&xv);CHKERRQ(ierr); 283ca15aa20SStefano Zampini ierr = MatDenseGetArray(Y,&yv);CHKERRQ(ierr); 284c5df96a5SBarry Smith ierr = PetscBLASIntCast(X->rmap->n*X->cmap->n,&N);CHKERRQ(ierr); 285c5df96a5SBarry Smith ierr = PetscBLASIntCast(X->rmap->n,&m);CHKERRQ(ierr); 286c5df96a5SBarry Smith ierr = PetscBLASIntCast(x->lda,&ldax);CHKERRQ(ierr); 287c5df96a5SBarry Smith ierr = PetscBLASIntCast(y->lda,&lday);CHKERRQ(ierr); 288a5ce6ee0Svictorle if (ldax>m || lday>m) { 289ca15aa20SStefano Zampini PetscInt j; 290ca15aa20SStefano Zampini 291d0f46423SBarry Smith for (j=0; j<X->cmap->n; j++) { 292ca15aa20SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&m,&alpha,xv+j*ldax,&one,yv+j*lday,&one)); 293a5ce6ee0Svictorle } 294a5ce6ee0Svictorle } else { 295ca15aa20SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&N,&alpha,xv,&one,yv,&one)); 296a5ce6ee0Svictorle } 297ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(X,&xv);CHKERRQ(ierr); 298ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(Y,&yv);CHKERRQ(ierr); 2990450473dSBarry Smith ierr = PetscLogFlops(PetscMax(2*N-1,0));CHKERRQ(ierr); 3003a40ed3dSBarry Smith PetscFunctionReturn(0); 3011987afe7SBarry Smith } 3021987afe7SBarry Smith 303e0877f53SBarry Smith static PetscErrorCode MatGetInfo_SeqDense(Mat A,MatInfoType flag,MatInfo *info) 304289bc588SBarry Smith { 305ca15aa20SStefano Zampini PetscLogDouble N = A->rmap->n*A->cmap->n; 3063a40ed3dSBarry Smith 3073a40ed3dSBarry Smith PetscFunctionBegin; 3084e220ebcSLois Curfman McInnes info->block_size = 1.0; 309ca15aa20SStefano Zampini info->nz_allocated = N; 310ca15aa20SStefano Zampini info->nz_used = N; 311ca15aa20SStefano Zampini info->nz_unneeded = 0; 312ca15aa20SStefano Zampini info->assemblies = A->num_ass; 3134e220ebcSLois Curfman McInnes info->mallocs = 0; 3147adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 3154e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 3164e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 3174e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 3183a40ed3dSBarry Smith PetscFunctionReturn(0); 319289bc588SBarry Smith } 320289bc588SBarry Smith 321637a0070SStefano Zampini PetscErrorCode MatScale_SeqDense(Mat A,PetscScalar alpha) 32280cd9d93SLois Curfman McInnes { 323273d9f13SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 324ca15aa20SStefano Zampini PetscScalar *v; 325efee365bSSatish Balay PetscErrorCode ierr; 326c5df96a5SBarry Smith PetscBLASInt one = 1,j,nz,lda; 32780cd9d93SLois Curfman McInnes 3283a40ed3dSBarry Smith PetscFunctionBegin; 329ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 330c5df96a5SBarry Smith ierr = PetscBLASIntCast(a->lda,&lda);CHKERRQ(ierr); 331d0f46423SBarry Smith if (lda>A->rmap->n) { 332c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&nz);CHKERRQ(ierr); 333d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 334ca15aa20SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&nz,&alpha,v+j*lda,&one)); 335a5ce6ee0Svictorle } 336a5ce6ee0Svictorle } else { 337c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n*A->cmap->n,&nz);CHKERRQ(ierr); 338ca15aa20SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&nz,&alpha,v,&one)); 339a5ce6ee0Svictorle } 340efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 341ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 3423a40ed3dSBarry Smith PetscFunctionReturn(0); 34380cd9d93SLois Curfman McInnes } 34480cd9d93SLois Curfman McInnes 345e0877f53SBarry Smith static PetscErrorCode MatIsHermitian_SeqDense(Mat A,PetscReal rtol,PetscBool *fl) 3461cbb95d3SBarry Smith { 3471cbb95d3SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 348ca15aa20SStefano Zampini PetscInt i,j,m = A->rmap->n,N = a->lda; 349ca15aa20SStefano Zampini const PetscScalar *v; 350ca15aa20SStefano Zampini PetscErrorCode ierr; 3511cbb95d3SBarry Smith 3521cbb95d3SBarry Smith PetscFunctionBegin; 3531cbb95d3SBarry Smith *fl = PETSC_FALSE; 354d0f46423SBarry Smith if (A->rmap->n != A->cmap->n) PetscFunctionReturn(0); 355ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 3561cbb95d3SBarry Smith for (i=0; i<m; i++) { 357ca15aa20SStefano Zampini for (j=i; j<m; j++) { 358637a0070SStefano Zampini if (PetscAbsScalar(v[i+j*N] - PetscConj(v[j+i*N])) > rtol) { 359637a0070SStefano Zampini goto restore; 3601cbb95d3SBarry Smith } 3611cbb95d3SBarry Smith } 362637a0070SStefano Zampini } 3631cbb95d3SBarry Smith *fl = PETSC_TRUE; 364637a0070SStefano Zampini restore: 365637a0070SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 366637a0070SStefano Zampini PetscFunctionReturn(0); 367637a0070SStefano Zampini } 368637a0070SStefano Zampini 369637a0070SStefano Zampini static PetscErrorCode MatIsSymmetric_SeqDense(Mat A,PetscReal rtol,PetscBool *fl) 370637a0070SStefano Zampini { 371637a0070SStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 372637a0070SStefano Zampini PetscInt i,j,m = A->rmap->n,N = a->lda; 373637a0070SStefano Zampini const PetscScalar *v; 374637a0070SStefano Zampini PetscErrorCode ierr; 375637a0070SStefano Zampini 376637a0070SStefano Zampini PetscFunctionBegin; 377637a0070SStefano Zampini *fl = PETSC_FALSE; 378637a0070SStefano Zampini if (A->rmap->n != A->cmap->n) PetscFunctionReturn(0); 379637a0070SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 380637a0070SStefano Zampini for (i=0; i<m; i++) { 381637a0070SStefano Zampini for (j=i; j<m; j++) { 382637a0070SStefano Zampini if (PetscAbsScalar(v[i+j*N] - v[j+i*N]) > rtol) { 383637a0070SStefano Zampini goto restore; 384637a0070SStefano Zampini } 385637a0070SStefano Zampini } 386637a0070SStefano Zampini } 387637a0070SStefano Zampini *fl = PETSC_TRUE; 388637a0070SStefano Zampini restore: 389637a0070SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 3901cbb95d3SBarry Smith PetscFunctionReturn(0); 3911cbb95d3SBarry Smith } 3921cbb95d3SBarry Smith 393ca15aa20SStefano Zampini PetscErrorCode MatDuplicateNoCreate_SeqDense(Mat newi,Mat A,MatDuplicateOption cpvalues) 394b24902e0SBarry Smith { 395ca15aa20SStefano Zampini Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 396b24902e0SBarry Smith PetscErrorCode ierr; 39723fc5dcaSStefano Zampini PetscInt lda = (PetscInt)mat->lda,j,m,nlda = lda; 398b24902e0SBarry Smith 399b24902e0SBarry Smith PetscFunctionBegin; 400aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->rmap,&newi->rmap);CHKERRQ(ierr); 401aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->cmap,&newi->cmap);CHKERRQ(ierr); 40223fc5dcaSStefano Zampini if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { /* propagate LDA */ 40323fc5dcaSStefano Zampini ierr = MatDenseSetLDA(newi,lda);CHKERRQ(ierr); 40423fc5dcaSStefano Zampini } 4050298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(newi,NULL);CHKERRQ(ierr); 406b24902e0SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 407ca15aa20SStefano Zampini const PetscScalar *av; 408ca15aa20SStefano Zampini PetscScalar *v; 409ca15aa20SStefano Zampini 410ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&av);CHKERRQ(ierr); 411ca15aa20SStefano Zampini ierr = MatDenseGetArray(newi,&v);CHKERRQ(ierr); 41223fc5dcaSStefano Zampini ierr = MatDenseGetLDA(newi,&nlda);CHKERRQ(ierr); 413d0f46423SBarry Smith m = A->rmap->n; 41423fc5dcaSStefano Zampini if (lda>m || nlda>m) { 415d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 41623fc5dcaSStefano Zampini ierr = PetscArraycpy(v+j*nlda,av+j*lda,m);CHKERRQ(ierr); 417b24902e0SBarry Smith } 418b24902e0SBarry Smith } else { 419ca15aa20SStefano Zampini ierr = PetscArraycpy(v,av,A->rmap->n*A->cmap->n);CHKERRQ(ierr); 420b24902e0SBarry Smith } 421ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(newi,&v);CHKERRQ(ierr); 422ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&av);CHKERRQ(ierr); 423b24902e0SBarry Smith } 424b24902e0SBarry Smith PetscFunctionReturn(0); 425b24902e0SBarry Smith } 426b24902e0SBarry Smith 427ca15aa20SStefano Zampini PetscErrorCode MatDuplicate_SeqDense(Mat A,MatDuplicateOption cpvalues,Mat *newmat) 42802cad45dSBarry Smith { 4296849ba73SBarry Smith PetscErrorCode ierr; 43002cad45dSBarry Smith 4313a40ed3dSBarry Smith PetscFunctionBegin; 432ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),newmat);CHKERRQ(ierr); 433d0f46423SBarry Smith ierr = MatSetSizes(*newmat,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 4345c9eb25fSBarry Smith ierr = MatSetType(*newmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 435719d5645SBarry Smith ierr = MatDuplicateNoCreate_SeqDense(*newmat,A,cpvalues);CHKERRQ(ierr); 436b24902e0SBarry Smith PetscFunctionReturn(0); 437b24902e0SBarry Smith } 438b24902e0SBarry Smith 439e0877f53SBarry Smith static PetscErrorCode MatLUFactorNumeric_SeqDense(Mat fact,Mat A,const MatFactorInfo *info_dummy) 440289bc588SBarry Smith { 4414482741eSBarry Smith MatFactorInfo info; 442a093e273SMatthew Knepley PetscErrorCode ierr; 4433a40ed3dSBarry Smith 4443a40ed3dSBarry Smith PetscFunctionBegin; 445c3ef05f6SHong Zhang ierr = MatDuplicateNoCreate_SeqDense(fact,A,MAT_COPY_VALUES);CHKERRQ(ierr); 446ca15aa20SStefano Zampini ierr = (*fact->ops->lufactor)(fact,0,0,&info);CHKERRQ(ierr); 4473a40ed3dSBarry Smith PetscFunctionReturn(0); 448289bc588SBarry Smith } 4496ee01492SSatish Balay 450e0877f53SBarry Smith static PetscErrorCode MatSolve_SeqDense(Mat A,Vec xx,Vec yy) 451289bc588SBarry Smith { 452c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 4536849ba73SBarry Smith PetscErrorCode ierr; 454f1ceaac6SMatthew G. Knepley const PetscScalar *x; 455f1ceaac6SMatthew G. Knepley PetscScalar *y; 456c5df96a5SBarry Smith PetscBLASInt one = 1,info,m; 45767e560aaSBarry Smith 4583a40ed3dSBarry Smith PetscFunctionBegin; 459c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 460f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 4611ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 462580bdb30SBarry Smith ierr = PetscArraycpy(y,x,A->rmap->n);CHKERRQ(ierr); 463d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_LU) { 46400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 4658b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_("N",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 46600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 467e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"GETRS - Bad solve"); 468d5f3da31SBarry Smith } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 469a49dc2a2SStefano Zampini if (A->spd) { 47000121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 4718b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info)); 47200121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 473e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 474a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 475a49dc2a2SStefano Zampini } else if (A->hermitian) { 47600121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 477a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrs",LAPACKhetrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 47800121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 479a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"HETRS Bad solve"); 480a49dc2a2SStefano Zampini #endif 481a49dc2a2SStefano Zampini } else { /* symmetric case */ 48200121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 483a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 48400121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 485a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"SYTRS Bad solve"); 486a49dc2a2SStefano Zampini } 4872205254eSKarl Rupp } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 488f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 4891ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 490dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 4913a40ed3dSBarry Smith PetscFunctionReturn(0); 492289bc588SBarry Smith } 4936ee01492SSatish Balay 494e0877f53SBarry Smith static PetscErrorCode MatMatSolve_SeqDense(Mat A,Mat B,Mat X) 49585e2c93fSHong Zhang { 49685e2c93fSHong Zhang Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 49785e2c93fSHong Zhang PetscErrorCode ierr; 4981683a169SBarry Smith const PetscScalar *b; 4991683a169SBarry Smith PetscScalar *x; 500efb80c78SLisandro Dalcin PetscInt n; 501783b601eSJed Brown PetscBLASInt nrhs,info,m; 50285e2c93fSHong Zhang 50385e2c93fSHong Zhang PetscFunctionBegin; 504c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 5050298fd71SBarry Smith ierr = MatGetSize(B,NULL,&n);CHKERRQ(ierr); 506c5df96a5SBarry Smith ierr = PetscBLASIntCast(n,&nrhs);CHKERRQ(ierr); 5071683a169SBarry Smith ierr = MatDenseGetArrayRead(B,&b);CHKERRQ(ierr); 5088c778c55SBarry Smith ierr = MatDenseGetArray(X,&x);CHKERRQ(ierr); 50985e2c93fSHong Zhang 510580bdb30SBarry Smith ierr = PetscArraycpy(x,b,m*nrhs);CHKERRQ(ierr); 51185e2c93fSHong Zhang 51285e2c93fSHong Zhang if (A->factortype == MAT_FACTOR_LU) { 51300121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5148b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_("N",&m,&nrhs,mat->v,&mat->lda,mat->pivots,x,&m,&info)); 51500121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 51685e2c93fSHong Zhang if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"GETRS - Bad solve"); 51785e2c93fSHong Zhang } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 518a49dc2a2SStefano Zampini if (A->spd) { 51900121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5208b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_("L",&m,&nrhs,mat->v,&mat->lda,x,&m,&info)); 52100121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 52285e2c93fSHong Zhang if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 523a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 524a49dc2a2SStefano Zampini } else if (A->hermitian) { 52500121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 526a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrs",LAPACKhetrs_("L",&m,&nrhs,mat->v,&mat->lda,mat->pivots,x,&m,&info)); 52700121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 528a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"HETRS Bad solve"); 529a49dc2a2SStefano Zampini #endif 530a49dc2a2SStefano Zampini } else { /* symmetric case */ 53100121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 532a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_("L",&m,&nrhs,mat->v,&mat->lda,mat->pivots,x,&m,&info)); 53300121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 534a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"SYTRS Bad solve"); 535a49dc2a2SStefano Zampini } 5362205254eSKarl Rupp } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 53785e2c93fSHong Zhang 5381683a169SBarry Smith ierr = MatDenseRestoreArrayRead(B,&b);CHKERRQ(ierr); 5398c778c55SBarry Smith ierr = MatDenseRestoreArray(X,&x);CHKERRQ(ierr); 54085e2c93fSHong Zhang ierr = PetscLogFlops(nrhs*(2.0*m*m - m));CHKERRQ(ierr); 54185e2c93fSHong Zhang PetscFunctionReturn(0); 54285e2c93fSHong Zhang } 54385e2c93fSHong Zhang 54400121966SStefano Zampini static PetscErrorCode MatConjugate_SeqDense(Mat); 54500121966SStefano Zampini 546e0877f53SBarry Smith static PetscErrorCode MatSolveTranspose_SeqDense(Mat A,Vec xx,Vec yy) 547da3a660dSBarry Smith { 548c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 549dfbe8321SBarry Smith PetscErrorCode ierr; 550f1ceaac6SMatthew G. Knepley const PetscScalar *x; 551f1ceaac6SMatthew G. Knepley PetscScalar *y; 552c5df96a5SBarry Smith PetscBLASInt one = 1,info,m; 55367e560aaSBarry Smith 5543a40ed3dSBarry Smith PetscFunctionBegin; 555c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 556f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 5571ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 558580bdb30SBarry Smith ierr = PetscArraycpy(y,x,A->rmap->n);CHKERRQ(ierr); 5598208b9aeSStefano Zampini if (A->factortype == MAT_FACTOR_LU) { 56000121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5618b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_("T",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 56200121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 563e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS - Bad solve"); 5648208b9aeSStefano Zampini } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 565a49dc2a2SStefano Zampini if (A->spd) { 56600121966SStefano Zampini #if defined(PETSC_USE_COMPLEX) 56700121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 56800121966SStefano Zampini #endif 56900121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5708b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info)); 57100121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 57200121966SStefano Zampini #if defined(PETSC_USE_COMPLEX) 57300121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 57400121966SStefano Zampini #endif 575a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 576a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 577a49dc2a2SStefano Zampini } else if (A->hermitian) { 57800121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 57900121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 58000121966SStefano Zampini PetscStackCallBLAS("LAPACKhetrs",LAPACKhetrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 58100121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 58200121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 583ae7cfcebSSatish Balay #endif 584a49dc2a2SStefano Zampini } else { /* symmetric case */ 58500121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 586a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 58700121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 588a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"SYTRS Bad solve"); 589da3a660dSBarry Smith } 590a49dc2a2SStefano Zampini } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 591f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 5921ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 593dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 5943a40ed3dSBarry Smith PetscFunctionReturn(0); 595da3a660dSBarry Smith } 5966ee01492SSatish Balay 597db4efbfdSBarry Smith /* ---------------------------------------------------------------*/ 598db4efbfdSBarry Smith /* COMMENT: I have chosen to hide row permutation in the pivots, 599db4efbfdSBarry Smith rather than put it in the Mat->row slot.*/ 600ca15aa20SStefano Zampini PetscErrorCode MatLUFactor_SeqDense(Mat A,IS row,IS col,const MatFactorInfo *minfo) 601db4efbfdSBarry Smith { 602db4efbfdSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 603db4efbfdSBarry Smith PetscErrorCode ierr; 604db4efbfdSBarry Smith PetscBLASInt n,m,info; 605db4efbfdSBarry Smith 606db4efbfdSBarry Smith PetscFunctionBegin; 607c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 608c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 609db4efbfdSBarry Smith if (!mat->pivots) { 6108208b9aeSStefano Zampini ierr = PetscMalloc1(A->rmap->n,&mat->pivots);CHKERRQ(ierr); 6113bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 612db4efbfdSBarry Smith } 613db4efbfdSBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 6148e57ea43SSatish Balay ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 6158b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrf",LAPACKgetrf_(&m,&n,mat->v,&mat->lda,mat->pivots,&info)); 6168e57ea43SSatish Balay ierr = PetscFPTrapPop();CHKERRQ(ierr); 6178e57ea43SSatish Balay 618e32f2f54SBarry Smith if (info<0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad argument to LU factorization"); 619e32f2f54SBarry Smith if (info>0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Bad LU factorization"); 6208208b9aeSStefano Zampini 621db4efbfdSBarry Smith A->ops->solve = MatSolve_SeqDense; 6228208b9aeSStefano Zampini A->ops->matsolve = MatMatSolve_SeqDense; 623db4efbfdSBarry Smith A->ops->solvetranspose = MatSolveTranspose_SeqDense; 624d5f3da31SBarry Smith A->factortype = MAT_FACTOR_LU; 625db4efbfdSBarry Smith 626f6224b95SHong Zhang ierr = PetscFree(A->solvertype);CHKERRQ(ierr); 627f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&A->solvertype);CHKERRQ(ierr); 628f6224b95SHong Zhang 629dc0b31edSSatish Balay ierr = PetscLogFlops((2.0*A->cmap->n*A->cmap->n*A->cmap->n)/3);CHKERRQ(ierr); 630db4efbfdSBarry Smith PetscFunctionReturn(0); 631db4efbfdSBarry Smith } 632db4efbfdSBarry Smith 633a49dc2a2SStefano Zampini /* Cholesky as L*L^T or L*D*L^T and the symmetric/hermitian complex variants */ 634ca15aa20SStefano Zampini PetscErrorCode MatCholeskyFactor_SeqDense(Mat A,IS perm,const MatFactorInfo *factinfo) 635db4efbfdSBarry Smith { 636db4efbfdSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 637db4efbfdSBarry Smith PetscErrorCode ierr; 638c5df96a5SBarry Smith PetscBLASInt info,n; 639db4efbfdSBarry Smith 640db4efbfdSBarry Smith PetscFunctionBegin; 641c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 642db4efbfdSBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 643a49dc2a2SStefano Zampini if (A->spd) { 64400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 6458b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrf",LAPACKpotrf_("L",&n,mat->v,&mat->lda,&info)); 64600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 647a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 648a49dc2a2SStefano Zampini } else if (A->hermitian) { 649a49dc2a2SStefano Zampini if (!mat->pivots) { 650a49dc2a2SStefano Zampini ierr = PetscMalloc1(A->rmap->n,&mat->pivots);CHKERRQ(ierr); 651a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 652a49dc2a2SStefano Zampini } 653a49dc2a2SStefano Zampini if (!mat->fwork) { 654a49dc2a2SStefano Zampini PetscScalar dummy; 655a49dc2a2SStefano Zampini 656a49dc2a2SStefano Zampini mat->lfwork = -1; 65700121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 658a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrf",LAPACKhetrf_("L",&n,mat->v,&mat->lda,mat->pivots,&dummy,&mat->lfwork,&info)); 65900121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 660a49dc2a2SStefano Zampini mat->lfwork = (PetscInt)PetscRealPart(dummy); 661a49dc2a2SStefano Zampini ierr = PetscMalloc1(mat->lfwork,&mat->fwork);CHKERRQ(ierr); 662a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,mat->lfwork*sizeof(PetscBLASInt));CHKERRQ(ierr); 663a49dc2a2SStefano Zampini } 66400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 665a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrf",LAPACKhetrf_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&mat->lfwork,&info)); 66600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 667a49dc2a2SStefano Zampini #endif 668a49dc2a2SStefano Zampini } else { /* symmetric case */ 669a49dc2a2SStefano Zampini if (!mat->pivots) { 670a49dc2a2SStefano Zampini ierr = PetscMalloc1(A->rmap->n,&mat->pivots);CHKERRQ(ierr); 671a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 672a49dc2a2SStefano Zampini } 673a49dc2a2SStefano Zampini if (!mat->fwork) { 674a49dc2a2SStefano Zampini PetscScalar dummy; 675a49dc2a2SStefano Zampini 676a49dc2a2SStefano Zampini mat->lfwork = -1; 67700121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 678a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_("L",&n,mat->v,&mat->lda,mat->pivots,&dummy,&mat->lfwork,&info)); 67900121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 680a49dc2a2SStefano Zampini mat->lfwork = (PetscInt)PetscRealPart(dummy); 681a49dc2a2SStefano Zampini ierr = PetscMalloc1(mat->lfwork,&mat->fwork);CHKERRQ(ierr); 682a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,mat->lfwork*sizeof(PetscBLASInt));CHKERRQ(ierr); 683a49dc2a2SStefano Zampini } 68400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 685a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&mat->lfwork,&info)); 68600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 687a49dc2a2SStefano Zampini } 688e32f2f54SBarry Smith if (info) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_CH_ZRPVT,"Bad factorization: zero pivot in row %D",(PetscInt)info-1); 6898208b9aeSStefano Zampini 690db4efbfdSBarry Smith A->ops->solve = MatSolve_SeqDense; 6918208b9aeSStefano Zampini A->ops->matsolve = MatMatSolve_SeqDense; 692db4efbfdSBarry Smith A->ops->solvetranspose = MatSolveTranspose_SeqDense; 693d5f3da31SBarry Smith A->factortype = MAT_FACTOR_CHOLESKY; 6942205254eSKarl Rupp 695f6224b95SHong Zhang ierr = PetscFree(A->solvertype);CHKERRQ(ierr); 696f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&A->solvertype);CHKERRQ(ierr); 697f6224b95SHong Zhang 698eb3f19e4SBarry Smith ierr = PetscLogFlops((1.0*A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 699db4efbfdSBarry Smith PetscFunctionReturn(0); 700db4efbfdSBarry Smith } 701db4efbfdSBarry Smith 7020481f469SBarry Smith PetscErrorCode MatCholeskyFactorNumeric_SeqDense(Mat fact,Mat A,const MatFactorInfo *info_dummy) 703db4efbfdSBarry Smith { 704db4efbfdSBarry Smith PetscErrorCode ierr; 705db4efbfdSBarry Smith MatFactorInfo info; 706db4efbfdSBarry Smith 707db4efbfdSBarry Smith PetscFunctionBegin; 708db4efbfdSBarry Smith info.fill = 1.0; 7092205254eSKarl Rupp 710c3ef05f6SHong Zhang ierr = MatDuplicateNoCreate_SeqDense(fact,A,MAT_COPY_VALUES);CHKERRQ(ierr); 711ca15aa20SStefano Zampini ierr = (*fact->ops->choleskyfactor)(fact,0,&info);CHKERRQ(ierr); 712db4efbfdSBarry Smith PetscFunctionReturn(0); 713db4efbfdSBarry Smith } 714db4efbfdSBarry Smith 715ca15aa20SStefano Zampini PetscErrorCode MatCholeskyFactorSymbolic_SeqDense(Mat fact,Mat A,IS row,const MatFactorInfo *info) 716db4efbfdSBarry Smith { 717db4efbfdSBarry Smith PetscFunctionBegin; 718c3ef05f6SHong Zhang fact->assembled = PETSC_TRUE; 7191bbcc794SSatish Balay fact->preallocated = PETSC_TRUE; 720719d5645SBarry Smith fact->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqDense; 721bd443b22SStefano Zampini fact->ops->solve = MatSolve_SeqDense; 722bd443b22SStefano Zampini fact->ops->matsolve = MatMatSolve_SeqDense; 723bd443b22SStefano Zampini fact->ops->solvetranspose = MatSolveTranspose_SeqDense; 724db4efbfdSBarry Smith PetscFunctionReturn(0); 725db4efbfdSBarry Smith } 726db4efbfdSBarry Smith 727ca15aa20SStefano Zampini PetscErrorCode MatLUFactorSymbolic_SeqDense(Mat fact,Mat A,IS row,IS col,const MatFactorInfo *info) 728db4efbfdSBarry Smith { 729db4efbfdSBarry Smith PetscFunctionBegin; 730b66fe19dSMatthew G Knepley fact->preallocated = PETSC_TRUE; 731c3ef05f6SHong Zhang fact->assembled = PETSC_TRUE; 732719d5645SBarry Smith fact->ops->lufactornumeric = MatLUFactorNumeric_SeqDense; 733bd443b22SStefano Zampini fact->ops->solve = MatSolve_SeqDense; 734bd443b22SStefano Zampini fact->ops->matsolve = MatMatSolve_SeqDense; 735bd443b22SStefano Zampini fact->ops->solvetranspose = MatSolveTranspose_SeqDense; 736db4efbfdSBarry Smith PetscFunctionReturn(0); 737db4efbfdSBarry Smith } 738db4efbfdSBarry Smith 739ca15aa20SStefano Zampini /* uses LAPACK */ 740cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatGetFactor_seqdense_petsc(Mat A,MatFactorType ftype,Mat *fact) 741db4efbfdSBarry Smith { 742db4efbfdSBarry Smith PetscErrorCode ierr; 743db4efbfdSBarry Smith 744db4efbfdSBarry Smith PetscFunctionBegin; 745ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),fact);CHKERRQ(ierr); 746db4efbfdSBarry Smith ierr = MatSetSizes(*fact,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 747ca15aa20SStefano Zampini ierr = MatSetType(*fact,MATDENSE);CHKERRQ(ierr); 748db4efbfdSBarry Smith if (ftype == MAT_FACTOR_LU) { 749db4efbfdSBarry Smith (*fact)->ops->lufactorsymbolic = MatLUFactorSymbolic_SeqDense; 750db4efbfdSBarry Smith } else { 751db4efbfdSBarry Smith (*fact)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqDense; 752db4efbfdSBarry Smith } 753d5f3da31SBarry Smith (*fact)->factortype = ftype; 75400c67f3bSHong Zhang 75500c67f3bSHong Zhang ierr = PetscFree((*fact)->solvertype);CHKERRQ(ierr); 75600c67f3bSHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&(*fact)->solvertype);CHKERRQ(ierr); 757db4efbfdSBarry Smith PetscFunctionReturn(0); 758db4efbfdSBarry Smith } 759db4efbfdSBarry Smith 760289bc588SBarry Smith /* ------------------------------------------------------------------*/ 761e0877f53SBarry Smith static PetscErrorCode MatSOR_SeqDense(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal shift,PetscInt its,PetscInt lits,Vec xx) 762289bc588SBarry Smith { 763c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 764d9ca1df4SBarry Smith PetscScalar *x,*v = mat->v,zero = 0.0,xt; 765d9ca1df4SBarry Smith const PetscScalar *b; 766dfbe8321SBarry Smith PetscErrorCode ierr; 767d0f46423SBarry Smith PetscInt m = A->rmap->n,i; 768c5df96a5SBarry Smith PetscBLASInt o = 1,bm; 769289bc588SBarry Smith 7703a40ed3dSBarry Smith PetscFunctionBegin; 771ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 772c70f7ee4SJunchao Zhang if (A->offloadmask == PETSC_OFFLOAD_GPU) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented"); 773ca15aa20SStefano Zampini #endif 774422a814eSBarry Smith if (shift == -1) shift = 0.0; /* negative shift indicates do not error on zero diagonal; this code never zeros on zero diagonal */ 775c5df96a5SBarry Smith ierr = PetscBLASIntCast(m,&bm);CHKERRQ(ierr); 776289bc588SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 7773bffc371SBarry Smith /* this is a hack fix, should have another version without the second BLASdotu */ 7782dcb1b2aSMatthew Knepley ierr = VecSet(xx,zero);CHKERRQ(ierr); 779289bc588SBarry Smith } 7801ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 781d9ca1df4SBarry Smith ierr = VecGetArrayRead(bb,&b);CHKERRQ(ierr); 782b965ef7fSBarry Smith its = its*lits; 783e32f2f54SBarry Smith if (its <= 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Relaxation requires global its %D and local its %D both positive",its,lits); 784289bc588SBarry Smith while (its--) { 785fccaa45eSBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 786289bc588SBarry Smith for (i=0; i<m; i++) { 7873bffc371SBarry Smith PetscStackCallBLAS("BLASdotu",xt = b[i] - BLASdotu_(&bm,v+i,&bm,x,&o)); 78855a1b374SBarry Smith x[i] = (1. - omega)*x[i] + omega*(xt+v[i + i*m]*x[i])/(v[i + i*m]+shift); 789289bc588SBarry Smith } 790289bc588SBarry Smith } 791fccaa45eSBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 792289bc588SBarry Smith for (i=m-1; i>=0; i--) { 7933bffc371SBarry Smith PetscStackCallBLAS("BLASdotu",xt = b[i] - BLASdotu_(&bm,v+i,&bm,x,&o)); 79455a1b374SBarry Smith x[i] = (1. - omega)*x[i] + omega*(xt+v[i + i*m]*x[i])/(v[i + i*m]+shift); 795289bc588SBarry Smith } 796289bc588SBarry Smith } 797289bc588SBarry Smith } 798d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 7991ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 8003a40ed3dSBarry Smith PetscFunctionReturn(0); 801289bc588SBarry Smith } 802289bc588SBarry Smith 803289bc588SBarry Smith /* -----------------------------------------------------------------*/ 804ca15aa20SStefano Zampini PetscErrorCode MatMultTranspose_SeqDense(Mat A,Vec xx,Vec yy) 805289bc588SBarry Smith { 806c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 807d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 808d9ca1df4SBarry Smith PetscScalar *y; 809dfbe8321SBarry Smith PetscErrorCode ierr; 8100805154bSBarry Smith PetscBLASInt m, n,_One=1; 811ea709b57SSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 8123a40ed3dSBarry Smith 8133a40ed3dSBarry Smith PetscFunctionBegin; 814c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 815c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 816d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8172bf066beSStefano Zampini ierr = VecGetArrayWrite(yy,&y);CHKERRQ(ierr); 8185ac36cfcSBarry Smith if (!A->rmap->n || !A->cmap->n) { 8195ac36cfcSBarry Smith PetscBLASInt i; 8205ac36cfcSBarry Smith for (i=0; i<n; i++) y[i] = 0.0; 8215ac36cfcSBarry Smith } else { 8228b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("T",&m,&n,&_DOne,v,&mat->lda,x,&_One,&_DZero,y,&_One)); 8235ac36cfcSBarry Smith ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 8245ac36cfcSBarry Smith } 825d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8262bf066beSStefano Zampini ierr = VecRestoreArrayWrite(yy,&y);CHKERRQ(ierr); 8273a40ed3dSBarry Smith PetscFunctionReturn(0); 828289bc588SBarry Smith } 829800995b7SMatthew Knepley 830ca15aa20SStefano Zampini PetscErrorCode MatMult_SeqDense(Mat A,Vec xx,Vec yy) 831289bc588SBarry Smith { 832c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 833d9ca1df4SBarry Smith PetscScalar *y,_DOne=1.0,_DZero=0.0; 834dfbe8321SBarry Smith PetscErrorCode ierr; 8350805154bSBarry Smith PetscBLASInt m, n, _One=1; 836d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 8373a40ed3dSBarry Smith 8383a40ed3dSBarry Smith PetscFunctionBegin; 839c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 840c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 841d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8422bf066beSStefano Zampini ierr = VecGetArrayWrite(yy,&y);CHKERRQ(ierr); 8435ac36cfcSBarry Smith if (!A->rmap->n || !A->cmap->n) { 8445ac36cfcSBarry Smith PetscBLASInt i; 8455ac36cfcSBarry Smith for (i=0; i<m; i++) y[i] = 0.0; 8465ac36cfcSBarry Smith } else { 8478b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("N",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DZero,y,&_One)); 8485ac36cfcSBarry Smith ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n - A->rmap->n);CHKERRQ(ierr); 8495ac36cfcSBarry Smith } 850d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8512bf066beSStefano Zampini ierr = VecRestoreArrayWrite(yy,&y);CHKERRQ(ierr); 8523a40ed3dSBarry Smith PetscFunctionReturn(0); 853289bc588SBarry Smith } 8546ee01492SSatish Balay 855ca15aa20SStefano Zampini PetscErrorCode MatMultAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 856289bc588SBarry Smith { 857c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 858d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 859d9ca1df4SBarry Smith PetscScalar *y,_DOne=1.0; 860dfbe8321SBarry Smith PetscErrorCode ierr; 8610805154bSBarry Smith PetscBLASInt m, n, _One=1; 8623a40ed3dSBarry Smith 8633a40ed3dSBarry Smith PetscFunctionBegin; 864c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 865c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 866d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 867600d6d0bSBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 868d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8691ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 8708b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("N",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DOne,y,&_One)); 871d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8721ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 873dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n);CHKERRQ(ierr); 8743a40ed3dSBarry Smith PetscFunctionReturn(0); 875289bc588SBarry Smith } 8766ee01492SSatish Balay 877ca15aa20SStefano Zampini PetscErrorCode MatMultTransposeAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 878289bc588SBarry Smith { 879c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 880d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 881d9ca1df4SBarry Smith PetscScalar *y; 882dfbe8321SBarry Smith PetscErrorCode ierr; 8830805154bSBarry Smith PetscBLASInt m, n, _One=1; 88487828ca2SBarry Smith PetscScalar _DOne=1.0; 8853a40ed3dSBarry Smith 8863a40ed3dSBarry Smith PetscFunctionBegin; 887c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 888c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 889d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 890600d6d0bSBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 891d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8921ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 8938b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("T",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DOne,y,&_One)); 894d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8951ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 896dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n);CHKERRQ(ierr); 8973a40ed3dSBarry Smith PetscFunctionReturn(0); 898289bc588SBarry Smith } 899289bc588SBarry Smith 900289bc588SBarry Smith /* -----------------------------------------------------------------*/ 901e0877f53SBarry Smith static PetscErrorCode MatGetRow_SeqDense(Mat A,PetscInt row,PetscInt *ncols,PetscInt **cols,PetscScalar **vals) 902289bc588SBarry Smith { 903c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 9046849ba73SBarry Smith PetscErrorCode ierr; 90513f74950SBarry Smith PetscInt i; 90667e560aaSBarry Smith 9073a40ed3dSBarry Smith PetscFunctionBegin; 908d0f46423SBarry Smith *ncols = A->cmap->n; 909289bc588SBarry Smith if (cols) { 910854ce69bSBarry Smith ierr = PetscMalloc1(A->cmap->n+1,cols);CHKERRQ(ierr); 911d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) (*cols)[i] = i; 912289bc588SBarry Smith } 913289bc588SBarry Smith if (vals) { 914ca15aa20SStefano Zampini const PetscScalar *v; 915ca15aa20SStefano Zampini 916ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 917854ce69bSBarry Smith ierr = PetscMalloc1(A->cmap->n+1,vals);CHKERRQ(ierr); 918ca15aa20SStefano Zampini v += row; 919d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) {(*vals)[i] = *v; v += mat->lda;} 920ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 921289bc588SBarry Smith } 9223a40ed3dSBarry Smith PetscFunctionReturn(0); 923289bc588SBarry Smith } 9246ee01492SSatish Balay 925e0877f53SBarry Smith static PetscErrorCode MatRestoreRow_SeqDense(Mat A,PetscInt row,PetscInt *ncols,PetscInt **cols,PetscScalar **vals) 926289bc588SBarry Smith { 927dfbe8321SBarry Smith PetscErrorCode ierr; 9286e111a19SKarl Rupp 929606d414cSSatish Balay PetscFunctionBegin; 930606d414cSSatish Balay if (cols) {ierr = PetscFree(*cols);CHKERRQ(ierr);} 931606d414cSSatish Balay if (vals) {ierr = PetscFree(*vals);CHKERRQ(ierr); } 9323a40ed3dSBarry Smith PetscFunctionReturn(0); 933289bc588SBarry Smith } 934289bc588SBarry Smith /* ----------------------------------------------------------------*/ 935e0877f53SBarry Smith static PetscErrorCode MatSetValues_SeqDense(Mat A,PetscInt m,const PetscInt indexm[],PetscInt n,const PetscInt indexn[],const PetscScalar v[],InsertMode addv) 936289bc588SBarry Smith { 937c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 938ca15aa20SStefano Zampini PetscScalar *av; 93913f74950SBarry Smith PetscInt i,j,idx=0; 940ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 941c70f7ee4SJunchao Zhang PetscOffloadMask oldf; 942ca15aa20SStefano Zampini #endif 943ca15aa20SStefano Zampini PetscErrorCode ierr; 944d6dfbf8fSBarry Smith 9453a40ed3dSBarry Smith PetscFunctionBegin; 946ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&av);CHKERRQ(ierr); 947289bc588SBarry Smith if (!mat->roworiented) { 948dbb450caSBarry Smith if (addv == INSERT_VALUES) { 949289bc588SBarry Smith for (j=0; j<n; j++) { 950cddbea37SSatish Balay if (indexn[j] < 0) {idx += m; continue;} 951cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexn[j] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 952289bc588SBarry Smith for (i=0; i<m; i++) { 953cddbea37SSatish Balay if (indexm[i] < 0) {idx++; continue;} 954cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexm[i] >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 955ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] = v[idx++]; 956289bc588SBarry Smith } 957289bc588SBarry Smith } 9583a40ed3dSBarry Smith } else { 959289bc588SBarry Smith for (j=0; j<n; j++) { 960cddbea37SSatish Balay if (indexn[j] < 0) {idx += m; continue;} 961cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexn[j] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 962289bc588SBarry Smith for (i=0; i<m; i++) { 963cddbea37SSatish Balay if (indexm[i] < 0) {idx++; continue;} 964cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexm[i] >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 965ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] += v[idx++]; 966289bc588SBarry Smith } 967289bc588SBarry Smith } 968289bc588SBarry Smith } 9693a40ed3dSBarry Smith } else { 970dbb450caSBarry Smith if (addv == INSERT_VALUES) { 971e8d4e0b9SBarry Smith for (i=0; i<m; i++) { 972cddbea37SSatish Balay if (indexm[i] < 0) { idx += n; continue;} 973cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexm[i] >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 974e8d4e0b9SBarry Smith for (j=0; j<n; j++) { 975cddbea37SSatish Balay if (indexn[j] < 0) { idx++; continue;} 976cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexn[j] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 977ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] = v[idx++]; 978e8d4e0b9SBarry Smith } 979e8d4e0b9SBarry Smith } 9803a40ed3dSBarry Smith } else { 981289bc588SBarry Smith for (i=0; i<m; i++) { 982cddbea37SSatish Balay if (indexm[i] < 0) { idx += n; continue;} 983cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexm[i] >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 984289bc588SBarry Smith for (j=0; j<n; j++) { 985cddbea37SSatish Balay if (indexn[j] < 0) { idx++; continue;} 986cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexn[j] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 987ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] += v[idx++]; 988289bc588SBarry Smith } 989289bc588SBarry Smith } 990289bc588SBarry Smith } 991e8d4e0b9SBarry Smith } 992ca15aa20SStefano Zampini /* hack to prevent unneeded copy to the GPU while returning the array */ 993ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 994c70f7ee4SJunchao Zhang oldf = A->offloadmask; 995c70f7ee4SJunchao Zhang A->offloadmask = PETSC_OFFLOAD_GPU; 996ca15aa20SStefano Zampini #endif 997ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&av);CHKERRQ(ierr); 998ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 999c70f7ee4SJunchao Zhang A->offloadmask = (oldf == PETSC_OFFLOAD_UNALLOCATED ? PETSC_OFFLOAD_UNALLOCATED : PETSC_OFFLOAD_CPU); 1000ca15aa20SStefano Zampini #endif 10013a40ed3dSBarry Smith PetscFunctionReturn(0); 1002289bc588SBarry Smith } 1003e8d4e0b9SBarry Smith 1004e0877f53SBarry Smith static PetscErrorCode MatGetValues_SeqDense(Mat A,PetscInt m,const PetscInt indexm[],PetscInt n,const PetscInt indexn[],PetscScalar v[]) 1005ae80bb75SLois Curfman McInnes { 1006ae80bb75SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1007ca15aa20SStefano Zampini const PetscScalar *vv; 100813f74950SBarry Smith PetscInt i,j; 1009ca15aa20SStefano Zampini PetscErrorCode ierr; 1010ae80bb75SLois Curfman McInnes 10113a40ed3dSBarry Smith PetscFunctionBegin; 1012ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&vv);CHKERRQ(ierr); 1013ae80bb75SLois Curfman McInnes /* row-oriented output */ 1014ae80bb75SLois Curfman McInnes for (i=0; i<m; i++) { 101597e567efSBarry Smith if (indexm[i] < 0) {v += n;continue;} 1016e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested larger than number rows %D",indexm[i],A->rmap->n); 1017ae80bb75SLois Curfman McInnes for (j=0; j<n; j++) { 10186f31f424SBarry Smith if (indexn[j] < 0) {v++; continue;} 1019e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column %D requested larger than number columns %D",indexn[j],A->cmap->n); 1020ca15aa20SStefano Zampini *v++ = vv[indexn[j]*mat->lda + indexm[i]]; 1021ae80bb75SLois Curfman McInnes } 1022ae80bb75SLois Curfman McInnes } 1023ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&vv);CHKERRQ(ierr); 10243a40ed3dSBarry Smith PetscFunctionReturn(0); 1025ae80bb75SLois Curfman McInnes } 1026ae80bb75SLois Curfman McInnes 1027289bc588SBarry Smith /* -----------------------------------------------------------------*/ 1028289bc588SBarry Smith 10298491ab44SLisandro Dalcin PetscErrorCode MatView_Dense_Binary(Mat mat,PetscViewer viewer) 1030aabbc4fbSShri Abhyankar { 1031aabbc4fbSShri Abhyankar PetscErrorCode ierr; 10328491ab44SLisandro Dalcin PetscBool skipHeader; 10338491ab44SLisandro Dalcin PetscViewerFormat format; 10348491ab44SLisandro Dalcin PetscInt header[4],M,N,m,lda,i,j,k; 10358491ab44SLisandro Dalcin const PetscScalar *v; 10368491ab44SLisandro Dalcin PetscScalar *vwork; 1037aabbc4fbSShri Abhyankar 1038aabbc4fbSShri Abhyankar PetscFunctionBegin; 10398491ab44SLisandro Dalcin ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 10408491ab44SLisandro Dalcin ierr = PetscViewerBinaryGetSkipHeader(viewer,&skipHeader);CHKERRQ(ierr); 10418491ab44SLisandro Dalcin ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 10428491ab44SLisandro Dalcin if (skipHeader) format = PETSC_VIEWER_NATIVE; 1043aabbc4fbSShri Abhyankar 10448491ab44SLisandro Dalcin ierr = MatGetSize(mat,&M,&N);CHKERRQ(ierr); 10458491ab44SLisandro Dalcin 10468491ab44SLisandro Dalcin /* write matrix header */ 10478491ab44SLisandro Dalcin header[0] = MAT_FILE_CLASSID; header[1] = M; header[2] = N; 10488491ab44SLisandro Dalcin header[3] = (format == PETSC_VIEWER_NATIVE) ? MATRIX_BINARY_FORMAT_DENSE : M*N; 10498491ab44SLisandro Dalcin if (!skipHeader) {ierr = PetscViewerBinaryWrite(viewer,header,4,PETSC_INT);CHKERRQ(ierr);} 10508491ab44SLisandro Dalcin 10518491ab44SLisandro Dalcin ierr = MatGetLocalSize(mat,&m,NULL);CHKERRQ(ierr); 10528491ab44SLisandro Dalcin if (format != PETSC_VIEWER_NATIVE) { 10538491ab44SLisandro Dalcin PetscInt nnz = m*N, *iwork; 10548491ab44SLisandro Dalcin /* store row lengths for each row */ 10558491ab44SLisandro Dalcin ierr = PetscMalloc1(nnz,&iwork);CHKERRQ(ierr); 10568491ab44SLisandro Dalcin for (i=0; i<m; i++) iwork[i] = N; 10578491ab44SLisandro Dalcin ierr = PetscViewerBinaryWriteAll(viewer,iwork,m,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_INT);CHKERRQ(ierr); 10588491ab44SLisandro Dalcin /* store column indices (zero start index) */ 10598491ab44SLisandro Dalcin for (k=0, i=0; i<m; i++) 10608491ab44SLisandro Dalcin for (j=0; j<N; j++, k++) 10618491ab44SLisandro Dalcin iwork[k] = j; 10628491ab44SLisandro Dalcin ierr = PetscViewerBinaryWriteAll(viewer,iwork,nnz,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_INT);CHKERRQ(ierr); 10638491ab44SLisandro Dalcin ierr = PetscFree(iwork);CHKERRQ(ierr); 10648491ab44SLisandro Dalcin } 10658491ab44SLisandro Dalcin /* store matrix values as a dense matrix in row major order */ 10668491ab44SLisandro Dalcin ierr = PetscMalloc1(m*N,&vwork);CHKERRQ(ierr); 10678491ab44SLisandro Dalcin ierr = MatDenseGetArrayRead(mat,&v);CHKERRQ(ierr); 10688491ab44SLisandro Dalcin ierr = MatDenseGetLDA(mat,&lda);CHKERRQ(ierr); 10698491ab44SLisandro Dalcin for (k=0, i=0; i<m; i++) 10708491ab44SLisandro Dalcin for (j=0; j<N; j++, k++) 10718491ab44SLisandro Dalcin vwork[k] = v[i+lda*j]; 10728491ab44SLisandro Dalcin ierr = MatDenseRestoreArrayRead(mat,&v);CHKERRQ(ierr); 10738491ab44SLisandro Dalcin ierr = PetscViewerBinaryWriteAll(viewer,vwork,m*N,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_SCALAR);CHKERRQ(ierr); 10748491ab44SLisandro Dalcin ierr = PetscFree(vwork);CHKERRQ(ierr); 10758491ab44SLisandro Dalcin PetscFunctionReturn(0); 10768491ab44SLisandro Dalcin } 10778491ab44SLisandro Dalcin 10788491ab44SLisandro Dalcin PetscErrorCode MatLoad_Dense_Binary(Mat mat,PetscViewer viewer) 10798491ab44SLisandro Dalcin { 10808491ab44SLisandro Dalcin PetscErrorCode ierr; 10818491ab44SLisandro Dalcin PetscBool skipHeader; 10828491ab44SLisandro Dalcin PetscInt header[4],M,N,m,nz,lda,i,j,k; 10838491ab44SLisandro Dalcin PetscInt rows,cols; 10848491ab44SLisandro Dalcin PetscScalar *v,*vwork; 10858491ab44SLisandro Dalcin 10868491ab44SLisandro Dalcin PetscFunctionBegin; 10878491ab44SLisandro Dalcin ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 10888491ab44SLisandro Dalcin ierr = PetscViewerBinaryGetSkipHeader(viewer,&skipHeader);CHKERRQ(ierr); 10898491ab44SLisandro Dalcin 10908491ab44SLisandro Dalcin if (!skipHeader) { 10918491ab44SLisandro Dalcin ierr = PetscViewerBinaryRead(viewer,header,4,NULL,PETSC_INT);CHKERRQ(ierr); 10928491ab44SLisandro Dalcin if (header[0] != MAT_FILE_CLASSID) SETERRQ(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Not a matrix object in file"); 10938491ab44SLisandro Dalcin M = header[1]; N = header[2]; 10948491ab44SLisandro Dalcin if (M < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix row size (%D) in file is negative",M); 10958491ab44SLisandro Dalcin if (N < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix column size (%D) in file is negative",N); 10968491ab44SLisandro Dalcin nz = header[3]; 10978491ab44SLisandro Dalcin if (nz != MATRIX_BINARY_FORMAT_DENSE && nz < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Unknown matrix format %D in file",nz); 1098aabbc4fbSShri Abhyankar } else { 10998491ab44SLisandro Dalcin ierr = MatGetSize(mat,&M,&N);CHKERRQ(ierr); 11008491ab44SLisandro Dalcin if (M < 0 || N < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Matrix binary file header was skipped, thus the user must specify the global sizes of input matrix"); 11018491ab44SLisandro Dalcin nz = MATRIX_BINARY_FORMAT_DENSE; 1102e6324fbbSBarry Smith } 1103aabbc4fbSShri Abhyankar 11048491ab44SLisandro Dalcin /* setup global sizes if not set */ 11058491ab44SLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 11068491ab44SLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 11078491ab44SLisandro Dalcin ierr = MatSetUp(mat);CHKERRQ(ierr); 11088491ab44SLisandro Dalcin /* check if global sizes are correct */ 11098491ab44SLisandro Dalcin ierr = MatGetSize(mat,&rows,&cols);CHKERRQ(ierr); 11108491ab44SLisandro Dalcin if (M != rows || N != cols) SETERRQ4(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%d, %d) than the input matrix (%d, %d)",M,N,rows,cols); 1111aabbc4fbSShri Abhyankar 11128491ab44SLisandro Dalcin ierr = MatGetSize(mat,NULL,&N);CHKERRQ(ierr); 11138491ab44SLisandro Dalcin ierr = MatGetLocalSize(mat,&m,NULL);CHKERRQ(ierr); 11148491ab44SLisandro Dalcin ierr = MatDenseGetArray(mat,&v);CHKERRQ(ierr); 11158491ab44SLisandro Dalcin ierr = MatDenseGetLDA(mat,&lda);CHKERRQ(ierr); 11168491ab44SLisandro Dalcin if (nz == MATRIX_BINARY_FORMAT_DENSE) { /* matrix in file is dense format */ 11178491ab44SLisandro Dalcin PetscInt nnz = m*N; 11188491ab44SLisandro Dalcin /* read in matrix values */ 11198491ab44SLisandro Dalcin ierr = PetscMalloc1(nnz,&vwork);CHKERRQ(ierr); 11208491ab44SLisandro Dalcin ierr = PetscViewerBinaryReadAll(viewer,vwork,nnz,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_SCALAR);CHKERRQ(ierr); 11218491ab44SLisandro Dalcin /* store values in column major order */ 11228491ab44SLisandro Dalcin for (j=0; j<N; j++) 11238491ab44SLisandro Dalcin for (i=0; i<m; i++) 11248491ab44SLisandro Dalcin v[i+lda*j] = vwork[i*N+j]; 11258491ab44SLisandro Dalcin ierr = PetscFree(vwork);CHKERRQ(ierr); 11268491ab44SLisandro Dalcin } else { /* matrix in file is sparse format */ 11278491ab44SLisandro Dalcin PetscInt nnz = 0, *rlens, *icols; 11288491ab44SLisandro Dalcin /* read in row lengths */ 11298491ab44SLisandro Dalcin ierr = PetscMalloc1(m,&rlens);CHKERRQ(ierr); 11308491ab44SLisandro Dalcin ierr = PetscViewerBinaryReadAll(viewer,rlens,m,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_INT);CHKERRQ(ierr); 11318491ab44SLisandro Dalcin for (i=0; i<m; i++) nnz += rlens[i]; 11328491ab44SLisandro Dalcin /* read in column indices and values */ 11338491ab44SLisandro Dalcin ierr = PetscMalloc2(nnz,&icols,nnz,&vwork);CHKERRQ(ierr); 11348491ab44SLisandro Dalcin ierr = PetscViewerBinaryReadAll(viewer,icols,nnz,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_INT);CHKERRQ(ierr); 11358491ab44SLisandro Dalcin ierr = PetscViewerBinaryReadAll(viewer,vwork,nnz,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_SCALAR);CHKERRQ(ierr); 11368491ab44SLisandro Dalcin /* store values in column major order */ 11378491ab44SLisandro Dalcin for (k=0, i=0; i<m; i++) 11388491ab44SLisandro Dalcin for (j=0; j<rlens[i]; j++, k++) 11398491ab44SLisandro Dalcin v[i+lda*icols[k]] = vwork[k]; 11408491ab44SLisandro Dalcin ierr = PetscFree(rlens);CHKERRQ(ierr); 11418491ab44SLisandro Dalcin ierr = PetscFree2(icols,vwork);CHKERRQ(ierr); 1142aabbc4fbSShri Abhyankar } 11438491ab44SLisandro Dalcin ierr = MatDenseRestoreArray(mat,&v);CHKERRQ(ierr); 11448491ab44SLisandro Dalcin ierr = MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 11458491ab44SLisandro Dalcin ierr = MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1146aabbc4fbSShri Abhyankar PetscFunctionReturn(0); 1147aabbc4fbSShri Abhyankar } 1148aabbc4fbSShri Abhyankar 1149eb91f321SVaclav Hapla PetscErrorCode MatLoad_SeqDense(Mat newMat, PetscViewer viewer) 1150eb91f321SVaclav Hapla { 1151eb91f321SVaclav Hapla PetscBool isbinary, ishdf5; 1152eb91f321SVaclav Hapla PetscErrorCode ierr; 1153eb91f321SVaclav Hapla 1154eb91f321SVaclav Hapla PetscFunctionBegin; 1155eb91f321SVaclav Hapla PetscValidHeaderSpecific(newMat,MAT_CLASSID,1); 1156eb91f321SVaclav Hapla PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2); 1157eb91f321SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 1158eb91f321SVaclav Hapla ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 1159eb91f321SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 1160eb91f321SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5, &ishdf5);CHKERRQ(ierr); 1161eb91f321SVaclav Hapla if (isbinary) { 11628491ab44SLisandro Dalcin ierr = MatLoad_Dense_Binary(newMat,viewer);CHKERRQ(ierr); 1163eb91f321SVaclav Hapla } else if (ishdf5) { 1164eb91f321SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 1165eb91f321SVaclav Hapla ierr = MatLoad_Dense_HDF5(newMat,viewer);CHKERRQ(ierr); 1166eb91f321SVaclav Hapla #else 1167eb91f321SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 1168eb91f321SVaclav Hapla #endif 1169eb91f321SVaclav Hapla } else { 1170eb91f321SVaclav Hapla SETERRQ2(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name); 1171eb91f321SVaclav Hapla } 1172eb91f321SVaclav Hapla PetscFunctionReturn(0); 1173eb91f321SVaclav Hapla } 1174eb91f321SVaclav Hapla 11756849ba73SBarry Smith static PetscErrorCode MatView_SeqDense_ASCII(Mat A,PetscViewer viewer) 1176289bc588SBarry Smith { 1177932b0c3eSLois Curfman McInnes Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1178dfbe8321SBarry Smith PetscErrorCode ierr; 117913f74950SBarry Smith PetscInt i,j; 11802dcb1b2aSMatthew Knepley const char *name; 1181ca15aa20SStefano Zampini PetscScalar *v,*av; 1182f3ef73ceSBarry Smith PetscViewerFormat format; 11835f481a85SSatish Balay #if defined(PETSC_USE_COMPLEX) 1184ace3abfcSBarry Smith PetscBool allreal = PETSC_TRUE; 11855f481a85SSatish Balay #endif 1186932b0c3eSLois Curfman McInnes 11873a40ed3dSBarry Smith PetscFunctionBegin; 1188ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,(const PetscScalar**)&av);CHKERRQ(ierr); 1189b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 1190456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 11913a40ed3dSBarry Smith PetscFunctionReturn(0); /* do nothing for now */ 1192fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 1193d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 1194d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1195ca15aa20SStefano Zampini v = av + i; 119677431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 1197d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1198aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 1199329f5518SBarry Smith if (PetscRealPart(*v) != 0.0 && PetscImaginaryPart(*v) != 0.0) { 120057622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i) ",j,(double)PetscRealPart(*v),(double)PetscImaginaryPart(*v));CHKERRQ(ierr); 1201329f5518SBarry Smith } else if (PetscRealPart(*v)) { 120257622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",j,(double)PetscRealPart(*v));CHKERRQ(ierr); 12036831982aSBarry Smith } 120480cd9d93SLois Curfman McInnes #else 12056831982aSBarry Smith if (*v) { 120657622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",j,(double)*v);CHKERRQ(ierr); 12076831982aSBarry Smith } 120880cd9d93SLois Curfman McInnes #endif 12091b807ce4Svictorle v += a->lda; 121080cd9d93SLois Curfman McInnes } 1211b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 121280cd9d93SLois Curfman McInnes } 1213d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 12143a40ed3dSBarry Smith } else { 1215d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 1216aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 121747989497SBarry Smith /* determine if matrix has all real values */ 1218ca15aa20SStefano Zampini v = av; 1219d0f46423SBarry Smith for (i=0; i<A->rmap->n*A->cmap->n; i++) { 1220ffac6cdbSBarry Smith if (PetscImaginaryPart(v[i])) { allreal = PETSC_FALSE; break;} 122147989497SBarry Smith } 122247989497SBarry Smith #endif 1223fb9695e5SSatish Balay if (format == PETSC_VIEWER_ASCII_MATLAB) { 12243a7fca6bSBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 1225d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",A->rmap->n,A->cmap->n);CHKERRQ(ierr); 1226d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%s = zeros(%D,%D);\n",name,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 1227fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"%s = [\n",name);CHKERRQ(ierr); 1228ffac6cdbSBarry Smith } 1229ffac6cdbSBarry Smith 1230d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1231ca15aa20SStefano Zampini v = av + i; 1232d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1233aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 123447989497SBarry Smith if (allreal) { 1235c61cd2faSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%18.16e ",(double)PetscRealPart(*v));CHKERRQ(ierr); 123647989497SBarry Smith } else { 1237c61cd2faSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%18.16e + %18.16ei ",(double)PetscRealPart(*v),(double)PetscImaginaryPart(*v));CHKERRQ(ierr); 123847989497SBarry Smith } 1239289bc588SBarry Smith #else 1240c61cd2faSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%18.16e ",(double)*v);CHKERRQ(ierr); 1241289bc588SBarry Smith #endif 12421b807ce4Svictorle v += a->lda; 1243289bc588SBarry Smith } 1244b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 1245289bc588SBarry Smith } 1246fb9695e5SSatish Balay if (format == PETSC_VIEWER_ASCII_MATLAB) { 1247b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"];\n");CHKERRQ(ierr); 1248ffac6cdbSBarry Smith } 1249d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 1250da3a660dSBarry Smith } 1251ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&av);CHKERRQ(ierr); 1252b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 12533a40ed3dSBarry Smith PetscFunctionReturn(0); 1254289bc588SBarry Smith } 1255289bc588SBarry Smith 12569804daf3SBarry Smith #include <petscdraw.h> 1257e0877f53SBarry Smith static PetscErrorCode MatView_SeqDense_Draw_Zoom(PetscDraw draw,void *Aa) 1258f1af5d2fSBarry Smith { 1259f1af5d2fSBarry Smith Mat A = (Mat) Aa; 12606849ba73SBarry Smith PetscErrorCode ierr; 1261383922c3SLisandro Dalcin PetscInt m = A->rmap->n,n = A->cmap->n,i,j; 1262383922c3SLisandro Dalcin int color = PETSC_DRAW_WHITE; 1263ca15aa20SStefano Zampini const PetscScalar *v; 1264b0a32e0cSBarry Smith PetscViewer viewer; 1265b05fc000SLisandro Dalcin PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 1266f3ef73ceSBarry Smith PetscViewerFormat format; 1267f1af5d2fSBarry Smith 1268f1af5d2fSBarry Smith PetscFunctionBegin; 1269f1af5d2fSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 1270b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 1271b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 1272f1af5d2fSBarry Smith 1273f1af5d2fSBarry Smith /* Loop over matrix elements drawing boxes */ 1274ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 1275fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 1276383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 1277f1af5d2fSBarry Smith /* Blue for negative and Red for positive */ 1278f1af5d2fSBarry Smith for (j = 0; j < n; j++) { 1279383922c3SLisandro Dalcin x_l = j; x_r = x_l + 1.0; 1280f1af5d2fSBarry Smith for (i = 0; i < m; i++) { 1281f1af5d2fSBarry Smith y_l = m - i - 1.0; 1282f1af5d2fSBarry Smith y_r = y_l + 1.0; 1283ca15aa20SStefano Zampini if (PetscRealPart(v[j*m+i]) > 0.) color = PETSC_DRAW_RED; 1284ca15aa20SStefano Zampini else if (PetscRealPart(v[j*m+i]) < 0.) color = PETSC_DRAW_BLUE; 1285ca15aa20SStefano Zampini else continue; 1286b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 1287f1af5d2fSBarry Smith } 1288f1af5d2fSBarry Smith } 1289383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 1290f1af5d2fSBarry Smith } else { 1291f1af5d2fSBarry Smith /* use contour shading to indicate magnitude of values */ 1292f1af5d2fSBarry Smith /* first determine max of all nonzero values */ 1293b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1294b05fc000SLisandro Dalcin PetscDraw popup; 1295b05fc000SLisandro Dalcin 1296f1af5d2fSBarry Smith for (i=0; i < m*n; i++) { 1297f1af5d2fSBarry Smith if (PetscAbsScalar(v[i]) > maxv) maxv = PetscAbsScalar(v[i]); 1298f1af5d2fSBarry Smith } 1299383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 1300b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 130145f3bb6eSLisandro Dalcin ierr = PetscDrawScalePopup(popup,minv,maxv);CHKERRQ(ierr); 1302383922c3SLisandro Dalcin 1303383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 1304f1af5d2fSBarry Smith for (j=0; j<n; j++) { 1305f1af5d2fSBarry Smith x_l = j; 1306f1af5d2fSBarry Smith x_r = x_l + 1.0; 1307f1af5d2fSBarry Smith for (i=0; i<m; i++) { 1308f1af5d2fSBarry Smith y_l = m - i - 1.0; 1309f1af5d2fSBarry Smith y_r = y_l + 1.0; 1310b05fc000SLisandro Dalcin color = PetscDrawRealToColor(PetscAbsScalar(v[j*m+i]),minv,maxv); 1311b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 1312f1af5d2fSBarry Smith } 1313f1af5d2fSBarry Smith } 1314383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 1315f1af5d2fSBarry Smith } 1316ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 1317f1af5d2fSBarry Smith PetscFunctionReturn(0); 1318f1af5d2fSBarry Smith } 1319f1af5d2fSBarry Smith 1320e0877f53SBarry Smith static PetscErrorCode MatView_SeqDense_Draw(Mat A,PetscViewer viewer) 1321f1af5d2fSBarry Smith { 1322b0a32e0cSBarry Smith PetscDraw draw; 1323ace3abfcSBarry Smith PetscBool isnull; 1324329f5518SBarry Smith PetscReal xr,yr,xl,yl,h,w; 1325dfbe8321SBarry Smith PetscErrorCode ierr; 1326f1af5d2fSBarry Smith 1327f1af5d2fSBarry Smith PetscFunctionBegin; 1328b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 1329b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 1330abc0a331SBarry Smith if (isnull) PetscFunctionReturn(0); 1331f1af5d2fSBarry Smith 1332d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1333f1af5d2fSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 1334b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 1335832b7cebSLisandro Dalcin ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 1336b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqDense_Draw_Zoom,A);CHKERRQ(ierr); 13370298fd71SBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL);CHKERRQ(ierr); 1338832b7cebSLisandro Dalcin ierr = PetscDrawSave(draw);CHKERRQ(ierr); 1339f1af5d2fSBarry Smith PetscFunctionReturn(0); 1340f1af5d2fSBarry Smith } 1341f1af5d2fSBarry Smith 1342dfbe8321SBarry Smith PetscErrorCode MatView_SeqDense(Mat A,PetscViewer viewer) 1343932b0c3eSLois Curfman McInnes { 1344dfbe8321SBarry Smith PetscErrorCode ierr; 1345ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1346932b0c3eSLois Curfman McInnes 13473a40ed3dSBarry Smith PetscFunctionBegin; 1348251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 1349251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 1350251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 13510f5bd95cSBarry Smith 1352c45a1595SBarry Smith if (iascii) { 1353c45a1595SBarry Smith ierr = MatView_SeqDense_ASCII(A,viewer);CHKERRQ(ierr); 13540f5bd95cSBarry Smith } else if (isbinary) { 1355637a0070SStefano Zampini ierr = MatView_Dense_Binary(A,viewer);CHKERRQ(ierr); 1356f1af5d2fSBarry Smith } else if (isdraw) { 1357f1af5d2fSBarry Smith ierr = MatView_SeqDense_Draw(A,viewer);CHKERRQ(ierr); 1358932b0c3eSLois Curfman McInnes } 13593a40ed3dSBarry Smith PetscFunctionReturn(0); 1360932b0c3eSLois Curfman McInnes } 1361289bc588SBarry Smith 1362637a0070SStefano Zampini static PetscErrorCode MatDensePlaceArray_SeqDense(Mat A,const PetscScalar *array) 1363d3042a70SBarry Smith { 1364d3042a70SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1365d3042a70SBarry Smith 1366d3042a70SBarry Smith PetscFunctionBegin; 13676947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 1368d5ea218eSStefano Zampini if (a->unplacedarray) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreArray first"); 1369d3042a70SBarry Smith a->unplacedarray = a->v; 1370d3042a70SBarry Smith a->unplaced_user_alloc = a->user_alloc; 1371d3042a70SBarry Smith a->v = (PetscScalar*) array; 1372637a0070SStefano Zampini a->user_alloc = PETSC_TRUE; 1373ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1374c70f7ee4SJunchao Zhang A->offloadmask = PETSC_OFFLOAD_CPU; 1375ca15aa20SStefano Zampini #endif 1376d3042a70SBarry Smith PetscFunctionReturn(0); 1377d3042a70SBarry Smith } 1378d3042a70SBarry Smith 1379d3042a70SBarry Smith static PetscErrorCode MatDenseResetArray_SeqDense(Mat A) 1380d3042a70SBarry Smith { 1381d3042a70SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1382d3042a70SBarry Smith 1383d3042a70SBarry Smith PetscFunctionBegin; 13846947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 1385d3042a70SBarry Smith a->v = a->unplacedarray; 1386d3042a70SBarry Smith a->user_alloc = a->unplaced_user_alloc; 1387d3042a70SBarry Smith a->unplacedarray = NULL; 1388ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1389c70f7ee4SJunchao Zhang A->offloadmask = PETSC_OFFLOAD_CPU; 1390ca15aa20SStefano Zampini #endif 1391d3042a70SBarry Smith PetscFunctionReturn(0); 1392d3042a70SBarry Smith } 1393d3042a70SBarry Smith 1394d5ea218eSStefano Zampini static PetscErrorCode MatDenseReplaceArray_SeqDense(Mat A,const PetscScalar *array) 1395d5ea218eSStefano Zampini { 1396d5ea218eSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1397d5ea218eSStefano Zampini PetscErrorCode ierr; 1398d5ea218eSStefano Zampini 1399d5ea218eSStefano Zampini PetscFunctionBegin; 1400d5ea218eSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 1401d5ea218eSStefano Zampini if (!a->user_alloc) { ierr = PetscFree(a->v);CHKERRQ(ierr); } 1402d5ea218eSStefano Zampini a->v = (PetscScalar*) array; 1403d5ea218eSStefano Zampini a->user_alloc = PETSC_FALSE; 1404d5ea218eSStefano Zampini #if defined(PETSC_HAVE_CUDA) 1405d5ea218eSStefano Zampini A->offloadmask = PETSC_OFFLOAD_CPU; 1406d5ea218eSStefano Zampini #endif 1407d5ea218eSStefano Zampini PetscFunctionReturn(0); 1408d5ea218eSStefano Zampini } 1409d5ea218eSStefano Zampini 1410ca15aa20SStefano Zampini PetscErrorCode MatDestroy_SeqDense(Mat mat) 1411289bc588SBarry Smith { 1412ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)mat->data; 1413dfbe8321SBarry Smith PetscErrorCode ierr; 141490f02eecSBarry Smith 14153a40ed3dSBarry Smith PetscFunctionBegin; 1416aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1417d0f46423SBarry Smith PetscLogObjectState((PetscObject)mat,"Rows %D Cols %D",mat->rmap->n,mat->cmap->n); 1418a5a9c739SBarry Smith #endif 141905b42c5fSBarry Smith ierr = PetscFree(l->pivots);CHKERRQ(ierr); 1420a49dc2a2SStefano Zampini ierr = PetscFree(l->fwork);CHKERRQ(ierr); 1421abc3b08eSStefano Zampini ierr = MatDestroy(&l->ptapwork);CHKERRQ(ierr); 14226857c123SSatish Balay if (!l->user_alloc) {ierr = PetscFree(l->v);CHKERRQ(ierr);} 1423637a0070SStefano Zampini if (!l->unplaced_user_alloc) {ierr = PetscFree(l->unplacedarray);CHKERRQ(ierr);} 14246947451fSStefano Zampini ierr = VecDestroy(&l->cvec);CHKERRQ(ierr); 1425bf0cc555SLisandro Dalcin ierr = PetscFree(mat->data);CHKERRQ(ierr); 1426dbd8c25aSHong Zhang 1427dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)mat,0);CHKERRQ(ierr); 142849a6ff4bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetLDA_C",NULL);CHKERRQ(ierr); 1429ad16ce7aSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseSetLDA_C",NULL);CHKERRQ(ierr); 1430bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetArray_C",NULL);CHKERRQ(ierr); 143152c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreArray_C",NULL);CHKERRQ(ierr); 1432d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDensePlaceArray_C",NULL);CHKERRQ(ierr); 1433d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseResetArray_C",NULL);CHKERRQ(ierr); 1434d5ea218eSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseReplaceArray_C",NULL);CHKERRQ(ierr); 143552c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetArrayRead_C",NULL);CHKERRQ(ierr); 143652c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreArrayRead_C",NULL);CHKERRQ(ierr); 14376947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetArrayWrite_C",NULL);CHKERRQ(ierr); 14386947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreArrayWrite_C",NULL);CHKERRQ(ierr); 14398baccfbdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatConvert_seqdense_seqaij_C",NULL);CHKERRQ(ierr); 14408baccfbdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 14418baccfbdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatConvert_seqdense_elemental_C",NULL);CHKERRQ(ierr); 14428baccfbdSHong Zhang #endif 14432bf066beSStefano Zampini #if defined(PETSC_HAVE_CUDA) 14442bf066beSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatConvert_seqdense_seqdensecuda_C",NULL);CHKERRQ(ierr); 14454222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqdensecuda_seqdensecuda_C",NULL);CHKERRQ(ierr); 14464222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqdensecuda_seqdense_C",NULL);CHKERRQ(ierr); 14474222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqaijcusparse_seqdense_C",NULL);CHKERRQ(ierr); 14482bf066beSStefano Zampini #endif 1449bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatSeqDenseSetPreallocation_C",NULL);CHKERRQ(ierr); 14504222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 14514222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqdense_seqdense_C",NULL);CHKERRQ(ierr); 14524222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqbaij_seqdense_C",NULL);CHKERRQ(ierr); 14534222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqsbaij_seqdense_C",NULL);CHKERRQ(ierr); 145452c5f739Sprj- 145586aefd0dSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumn_C",NULL);CHKERRQ(ierr); 145686aefd0dSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumn_C",NULL);CHKERRQ(ierr); 14576947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumnVec_C",NULL);CHKERRQ(ierr); 14586947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumnVec_C",NULL);CHKERRQ(ierr); 14596947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumnVecRead_C",NULL);CHKERRQ(ierr); 14606947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumnVecRead_C",NULL);CHKERRQ(ierr); 14616947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumnVecWrite_C",NULL);CHKERRQ(ierr); 14626947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumnVecWrite_C",NULL);CHKERRQ(ierr); 14633a40ed3dSBarry Smith PetscFunctionReturn(0); 1464289bc588SBarry Smith } 1465289bc588SBarry Smith 1466e0877f53SBarry Smith static PetscErrorCode MatTranspose_SeqDense(Mat A,MatReuse reuse,Mat *matout) 1467289bc588SBarry Smith { 1468c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 14696849ba73SBarry Smith PetscErrorCode ierr; 147013f74950SBarry Smith PetscInt k,j,m,n,M; 147187828ca2SBarry Smith PetscScalar *v,tmp; 147248b35521SBarry Smith 14733a40ed3dSBarry Smith PetscFunctionBegin; 1474ca15aa20SStefano Zampini m = A->rmap->n; M = mat->lda; n = A->cmap->n; 14752847e3fdSStefano Zampini if (reuse == MAT_INPLACE_MATRIX && m == n) { /* in place transpose */ 1476ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 1477d3e5ee88SLois Curfman McInnes for (j=0; j<m; j++) { 1478289bc588SBarry Smith for (k=0; k<j; k++) { 14791b807ce4Svictorle tmp = v[j + k*M]; 14801b807ce4Svictorle v[j + k*M] = v[k + j*M]; 14811b807ce4Svictorle v[k + j*M] = tmp; 1482289bc588SBarry Smith } 1483289bc588SBarry Smith } 1484ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 14853a40ed3dSBarry Smith } else { /* out-of-place transpose */ 1486d3e5ee88SLois Curfman McInnes Mat tmat; 1487ec8511deSBarry Smith Mat_SeqDense *tmatd; 148887828ca2SBarry Smith PetscScalar *v2; 1489af36a384SStefano Zampini PetscInt M2; 1490ea709b57SSatish Balay 14912847e3fdSStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 1492ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&tmat);CHKERRQ(ierr); 1493d0f46423SBarry Smith ierr = MatSetSizes(tmat,A->cmap->n,A->rmap->n,A->cmap->n,A->rmap->n);CHKERRQ(ierr); 14947adad957SLisandro Dalcin ierr = MatSetType(tmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 14950298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(tmat,NULL);CHKERRQ(ierr); 1496ca15aa20SStefano Zampini } else tmat = *matout; 1497ca15aa20SStefano Zampini 1498ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,(const PetscScalar**)&v);CHKERRQ(ierr); 1499ca15aa20SStefano Zampini ierr = MatDenseGetArray(tmat,&v2);CHKERRQ(ierr); 1500ec8511deSBarry Smith tmatd = (Mat_SeqDense*)tmat->data; 1501ca15aa20SStefano Zampini M2 = tmatd->lda; 1502d3e5ee88SLois Curfman McInnes for (j=0; j<n; j++) { 1503af36a384SStefano Zampini for (k=0; k<m; k++) v2[j + k*M2] = v[k + j*M]; 1504d3e5ee88SLois Curfman McInnes } 1505ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(tmat,&v2);CHKERRQ(ierr); 1506ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&v);CHKERRQ(ierr); 15076d4a8577SBarry Smith ierr = MatAssemblyBegin(tmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15086d4a8577SBarry Smith ierr = MatAssemblyEnd(tmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15092847e3fdSStefano Zampini if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) *matout = tmat; 15102847e3fdSStefano Zampini else { 15112847e3fdSStefano Zampini ierr = MatHeaderMerge(A,&tmat);CHKERRQ(ierr); 15122847e3fdSStefano Zampini } 151348b35521SBarry Smith } 15143a40ed3dSBarry Smith PetscFunctionReturn(0); 1515289bc588SBarry Smith } 1516289bc588SBarry Smith 1517e0877f53SBarry Smith static PetscErrorCode MatEqual_SeqDense(Mat A1,Mat A2,PetscBool *flg) 1518289bc588SBarry Smith { 1519c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat1 = (Mat_SeqDense*)A1->data; 1520c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat2 = (Mat_SeqDense*)A2->data; 1521ca15aa20SStefano Zampini PetscInt i; 1522ca15aa20SStefano Zampini const PetscScalar *v1,*v2; 1523ca15aa20SStefano Zampini PetscErrorCode ierr; 15249ea5d5aeSSatish Balay 15253a40ed3dSBarry Smith PetscFunctionBegin; 1526d0f46423SBarry Smith if (A1->rmap->n != A2->rmap->n) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 1527d0f46423SBarry Smith if (A1->cmap->n != A2->cmap->n) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 1528ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A1,&v1);CHKERRQ(ierr); 1529ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A2,&v2);CHKERRQ(ierr); 1530ca15aa20SStefano Zampini for (i=0; i<A1->cmap->n; i++) { 1531ca15aa20SStefano Zampini ierr = PetscArraycmp(v1,v2,A1->rmap->n,flg);CHKERRQ(ierr); 1532ca15aa20SStefano Zampini if (*flg == PETSC_FALSE) PetscFunctionReturn(0); 1533ca15aa20SStefano Zampini v1 += mat1->lda; 1534ca15aa20SStefano Zampini v2 += mat2->lda; 15351b807ce4Svictorle } 1536ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A1,&v1);CHKERRQ(ierr); 1537ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A2,&v2);CHKERRQ(ierr); 153877c4ece6SBarry Smith *flg = PETSC_TRUE; 15393a40ed3dSBarry Smith PetscFunctionReturn(0); 1540289bc588SBarry Smith } 1541289bc588SBarry Smith 1542e0877f53SBarry Smith static PetscErrorCode MatGetDiagonal_SeqDense(Mat A,Vec v) 1543289bc588SBarry Smith { 1544c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 154513f74950SBarry Smith PetscInt i,n,len; 1546ca15aa20SStefano Zampini PetscScalar *x; 1547ca15aa20SStefano Zampini const PetscScalar *vv; 1548ca15aa20SStefano Zampini PetscErrorCode ierr; 154944cd7ae7SLois Curfman McInnes 15503a40ed3dSBarry Smith PetscFunctionBegin; 15517a97a34bSBarry Smith ierr = VecGetSize(v,&n);CHKERRQ(ierr); 15521ebc52fbSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1553d0f46423SBarry Smith len = PetscMin(A->rmap->n,A->cmap->n); 1554ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&vv);CHKERRQ(ierr); 1555e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming mat and vec"); 155644cd7ae7SLois Curfman McInnes for (i=0; i<len; i++) { 1557ca15aa20SStefano Zampini x[i] = vv[i*mat->lda + i]; 1558289bc588SBarry Smith } 1559ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&vv);CHKERRQ(ierr); 15601ebc52fbSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 15613a40ed3dSBarry Smith PetscFunctionReturn(0); 1562289bc588SBarry Smith } 1563289bc588SBarry Smith 1564e0877f53SBarry Smith static PetscErrorCode MatDiagonalScale_SeqDense(Mat A,Vec ll,Vec rr) 1565289bc588SBarry Smith { 1566c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1567f1ceaac6SMatthew G. Knepley const PetscScalar *l,*r; 1568ca15aa20SStefano Zampini PetscScalar x,*v,*vv; 1569dfbe8321SBarry Smith PetscErrorCode ierr; 1570d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n; 157155659b69SBarry Smith 15723a40ed3dSBarry Smith PetscFunctionBegin; 1573ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&vv);CHKERRQ(ierr); 157428988994SBarry Smith if (ll) { 15757a97a34bSBarry Smith ierr = VecGetSize(ll,&m);CHKERRQ(ierr); 1576f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(ll,&l);CHKERRQ(ierr); 1577e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vec wrong size"); 1578da3a660dSBarry Smith for (i=0; i<m; i++) { 1579da3a660dSBarry Smith x = l[i]; 1580ca15aa20SStefano Zampini v = vv + i; 1581b43bac26SStefano Zampini for (j=0; j<n; j++) { (*v) *= x; v+= mat->lda;} 1582da3a660dSBarry Smith } 1583f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(ll,&l);CHKERRQ(ierr); 1584eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*n*m);CHKERRQ(ierr); 1585da3a660dSBarry Smith } 158628988994SBarry Smith if (rr) { 15877a97a34bSBarry Smith ierr = VecGetSize(rr,&n);CHKERRQ(ierr); 1588f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(rr,&r);CHKERRQ(ierr); 1589e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vec wrong size"); 1590da3a660dSBarry Smith for (i=0; i<n; i++) { 1591da3a660dSBarry Smith x = r[i]; 1592ca15aa20SStefano Zampini v = vv + i*mat->lda; 15932205254eSKarl Rupp for (j=0; j<m; j++) (*v++) *= x; 1594da3a660dSBarry Smith } 1595f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(rr,&r);CHKERRQ(ierr); 1596eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*n*m);CHKERRQ(ierr); 1597da3a660dSBarry Smith } 1598ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&vv);CHKERRQ(ierr); 15993a40ed3dSBarry Smith PetscFunctionReturn(0); 1600289bc588SBarry Smith } 1601289bc588SBarry Smith 1602ca15aa20SStefano Zampini PetscErrorCode MatNorm_SeqDense(Mat A,NormType type,PetscReal *nrm) 1603289bc588SBarry Smith { 1604c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1605ca15aa20SStefano Zampini PetscScalar *v,*vv; 1606329f5518SBarry Smith PetscReal sum = 0.0; 1607d0f46423SBarry Smith PetscInt lda =mat->lda,m=A->rmap->n,i,j; 1608efee365bSSatish Balay PetscErrorCode ierr; 160955659b69SBarry Smith 16103a40ed3dSBarry Smith PetscFunctionBegin; 1611ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,(const PetscScalar**)&vv);CHKERRQ(ierr); 1612ca15aa20SStefano Zampini v = vv; 1613289bc588SBarry Smith if (type == NORM_FROBENIUS) { 1614a5ce6ee0Svictorle if (lda>m) { 1615d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1616ca15aa20SStefano Zampini v = vv+j*lda; 1617a5ce6ee0Svictorle for (i=0; i<m; i++) { 1618a5ce6ee0Svictorle sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 1619a5ce6ee0Svictorle } 1620a5ce6ee0Svictorle } 1621a5ce6ee0Svictorle } else { 1622570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 1623570b7f6dSBarry Smith PetscBLASInt one = 1,cnt = A->cmap->n*A->rmap->n; 1624570b7f6dSBarry Smith *nrm = BLASnrm2_(&cnt,v,&one); 1625570b7f6dSBarry Smith } 1626570b7f6dSBarry Smith #else 1627d0f46423SBarry Smith for (i=0; i<A->cmap->n*A->rmap->n; i++) { 1628329f5518SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 1629289bc588SBarry Smith } 1630a5ce6ee0Svictorle } 16318f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 1632570b7f6dSBarry Smith #endif 1633dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 16343a40ed3dSBarry Smith } else if (type == NORM_1) { 1635064f8208SBarry Smith *nrm = 0.0; 1636d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1637ca15aa20SStefano Zampini v = vv + j*mat->lda; 1638289bc588SBarry Smith sum = 0.0; 1639d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 164033a8263dSBarry Smith sum += PetscAbsScalar(*v); v++; 1641289bc588SBarry Smith } 1642064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 1643289bc588SBarry Smith } 1644eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 16453a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 1646064f8208SBarry Smith *nrm = 0.0; 1647d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 1648ca15aa20SStefano Zampini v = vv + j; 1649289bc588SBarry Smith sum = 0.0; 1650d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) { 16511b807ce4Svictorle sum += PetscAbsScalar(*v); v += mat->lda; 1652289bc588SBarry Smith } 1653064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 1654289bc588SBarry Smith } 1655eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 1656e7e72b3dSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No two norm"); 1657ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&vv);CHKERRQ(ierr); 16583a40ed3dSBarry Smith PetscFunctionReturn(0); 1659289bc588SBarry Smith } 1660289bc588SBarry Smith 1661e0877f53SBarry Smith static PetscErrorCode MatSetOption_SeqDense(Mat A,MatOption op,PetscBool flg) 1662289bc588SBarry Smith { 1663c0bbcb79SLois Curfman McInnes Mat_SeqDense *aij = (Mat_SeqDense*)A->data; 166463ba0a88SBarry Smith PetscErrorCode ierr; 166567e560aaSBarry Smith 16663a40ed3dSBarry Smith PetscFunctionBegin; 1667b5a2b587SKris Buschelman switch (op) { 1668b5a2b587SKris Buschelman case MAT_ROW_ORIENTED: 16694e0d8c25SBarry Smith aij->roworiented = flg; 1670b5a2b587SKris Buschelman break; 1671512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1672b5a2b587SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 16733971808eSMatthew Knepley case MAT_NEW_NONZERO_ALLOCATION_ERR: 16744e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 167513fa8e87SLisandro Dalcin case MAT_KEEP_NONZERO_PATTERN: 1676b5a2b587SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1677b5a2b587SKris Buschelman case MAT_USE_HASH_TABLE: 16780f8fb01aSBarry Smith case MAT_IGNORE_ZERO_ENTRIES: 16795021d80fSJed Brown case MAT_IGNORE_LOWER_TRIANGULAR: 1680071fcb05SBarry Smith case MAT_SORTED_FULL: 16815021d80fSJed Brown ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 16825021d80fSJed Brown break; 16835021d80fSJed Brown case MAT_SPD: 168477e54ba9SKris Buschelman case MAT_SYMMETRIC: 168577e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 16869a4540c5SBarry Smith case MAT_HERMITIAN: 16879a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 16885021d80fSJed Brown /* These options are handled directly by MatSetOption() */ 168977e54ba9SKris Buschelman break; 1690b5a2b587SKris Buschelman default: 1691e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %s",MatOptions[op]); 16923a40ed3dSBarry Smith } 16933a40ed3dSBarry Smith PetscFunctionReturn(0); 1694289bc588SBarry Smith } 1695289bc588SBarry Smith 1696e0877f53SBarry Smith static PetscErrorCode MatZeroEntries_SeqDense(Mat A) 16976f0a148fSBarry Smith { 1698ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)A->data; 16996849ba73SBarry Smith PetscErrorCode ierr; 1700d0f46423SBarry Smith PetscInt lda=l->lda,m=A->rmap->n,j; 1701ca15aa20SStefano Zampini PetscScalar *v; 17023a40ed3dSBarry Smith 17033a40ed3dSBarry Smith PetscFunctionBegin; 1704ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 1705a5ce6ee0Svictorle if (lda>m) { 1706d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1707ca15aa20SStefano Zampini ierr = PetscArrayzero(v+j*lda,m);CHKERRQ(ierr); 1708a5ce6ee0Svictorle } 1709a5ce6ee0Svictorle } else { 1710ca15aa20SStefano Zampini ierr = PetscArrayzero(v,A->rmap->n*A->cmap->n);CHKERRQ(ierr); 1711a5ce6ee0Svictorle } 1712ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 17133a40ed3dSBarry Smith PetscFunctionReturn(0); 17146f0a148fSBarry Smith } 17156f0a148fSBarry Smith 1716e0877f53SBarry Smith static PetscErrorCode MatZeroRows_SeqDense(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 17176f0a148fSBarry Smith { 171897b48c8fSBarry Smith PetscErrorCode ierr; 1719ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)A->data; 1720b9679d65SBarry Smith PetscInt m = l->lda, n = A->cmap->n, i,j; 1721ca15aa20SStefano Zampini PetscScalar *slot,*bb,*v; 172297b48c8fSBarry Smith const PetscScalar *xx; 172355659b69SBarry Smith 17243a40ed3dSBarry Smith PetscFunctionBegin; 172576bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 1726b9679d65SBarry Smith for (i=0; i<N; i++) { 1727b9679d65SBarry Smith if (rows[i] < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row requested to be zeroed"); 1728b9679d65SBarry Smith if (rows[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested to be zeroed greater than or equal number of rows %D",rows[i],A->rmap->n); 1729b9679d65SBarry Smith } 173076bd3646SJed Brown } 1731ca15aa20SStefano Zampini if (!N) PetscFunctionReturn(0); 1732b9679d65SBarry Smith 173397b48c8fSBarry Smith /* fix right hand side if needed */ 173497b48c8fSBarry Smith if (x && b) { 173597b48c8fSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 173697b48c8fSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 17372205254eSKarl Rupp for (i=0; i<N; i++) bb[rows[i]] = diag*xx[rows[i]]; 173897b48c8fSBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 173997b48c8fSBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 174097b48c8fSBarry Smith } 174197b48c8fSBarry Smith 1742ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 17436f0a148fSBarry Smith for (i=0; i<N; i++) { 1744ca15aa20SStefano Zampini slot = v + rows[i]; 1745b9679d65SBarry Smith for (j=0; j<n; j++) { *slot = 0.0; slot += m;} 17466f0a148fSBarry Smith } 1747f4df32b1SMatthew Knepley if (diag != 0.0) { 1748b9679d65SBarry Smith if (A->rmap->n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only coded for square matrices"); 17496f0a148fSBarry Smith for (i=0; i<N; i++) { 1750ca15aa20SStefano Zampini slot = v + (m+1)*rows[i]; 1751f4df32b1SMatthew Knepley *slot = diag; 17526f0a148fSBarry Smith } 17536f0a148fSBarry Smith } 1754ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 17553a40ed3dSBarry Smith PetscFunctionReturn(0); 17566f0a148fSBarry Smith } 1757557bce09SLois Curfman McInnes 175849a6ff4bSBarry Smith static PetscErrorCode MatDenseGetLDA_SeqDense(Mat A,PetscInt *lda) 175949a6ff4bSBarry Smith { 176049a6ff4bSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 176149a6ff4bSBarry Smith 176249a6ff4bSBarry Smith PetscFunctionBegin; 176349a6ff4bSBarry Smith *lda = mat->lda; 176449a6ff4bSBarry Smith PetscFunctionReturn(0); 176549a6ff4bSBarry Smith } 176649a6ff4bSBarry Smith 1767637a0070SStefano Zampini PetscErrorCode MatDenseGetArray_SeqDense(Mat A,PetscScalar **array) 176864e87e97SBarry Smith { 1769c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 17703a40ed3dSBarry Smith 17713a40ed3dSBarry Smith PetscFunctionBegin; 177264e87e97SBarry Smith *array = mat->v; 17733a40ed3dSBarry Smith PetscFunctionReturn(0); 177464e87e97SBarry Smith } 17750754003eSLois Curfman McInnes 1776637a0070SStefano Zampini PetscErrorCode MatDenseRestoreArray_SeqDense(Mat A,PetscScalar **array) 1777ff14e315SSatish Balay { 17783a40ed3dSBarry Smith PetscFunctionBegin; 1779637a0070SStefano Zampini *array = NULL; 17803a40ed3dSBarry Smith PetscFunctionReturn(0); 1781ff14e315SSatish Balay } 17820754003eSLois Curfman McInnes 1783dec5eb66SMatthew G Knepley /*@C 178449a6ff4bSBarry Smith MatDenseGetLDA - gets the leading dimension of the array returned from MatDenseGetArray() 178549a6ff4bSBarry Smith 1786ad16ce7aSStefano Zampini Not collective 178749a6ff4bSBarry Smith 178849a6ff4bSBarry Smith Input Parameter: 178949a6ff4bSBarry Smith . mat - a MATSEQDENSE or MATMPIDENSE matrix 179049a6ff4bSBarry Smith 179149a6ff4bSBarry Smith Output Parameter: 179249a6ff4bSBarry Smith . lda - the leading dimension 179349a6ff4bSBarry Smith 179449a6ff4bSBarry Smith Level: intermediate 179549a6ff4bSBarry Smith 1796ad16ce7aSStefano Zampini .seealso: MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead(), MatDenseSetLDA() 179749a6ff4bSBarry Smith @*/ 179849a6ff4bSBarry Smith PetscErrorCode MatDenseGetLDA(Mat A,PetscInt *lda) 179949a6ff4bSBarry Smith { 180049a6ff4bSBarry Smith PetscErrorCode ierr; 180149a6ff4bSBarry Smith 180249a6ff4bSBarry Smith PetscFunctionBegin; 1803d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1804d5ea218eSStefano Zampini PetscValidPointer(lda,2); 180549a6ff4bSBarry Smith ierr = PetscUseMethod(A,"MatDenseGetLDA_C",(Mat,PetscInt*),(A,lda));CHKERRQ(ierr); 180649a6ff4bSBarry Smith PetscFunctionReturn(0); 180749a6ff4bSBarry Smith } 180849a6ff4bSBarry Smith 180949a6ff4bSBarry Smith /*@C 1810ad16ce7aSStefano Zampini MatDenseSetLDA - Sets the leading dimension of the array used by the dense matrix 1811ad16ce7aSStefano Zampini 1812ad16ce7aSStefano Zampini Not collective 1813ad16ce7aSStefano Zampini 1814ad16ce7aSStefano Zampini Input Parameter: 1815ad16ce7aSStefano Zampini + mat - a MATSEQDENSE or MATMPIDENSE matrix 1816ad16ce7aSStefano Zampini - lda - the leading dimension 1817ad16ce7aSStefano Zampini 1818ad16ce7aSStefano Zampini Level: intermediate 1819ad16ce7aSStefano Zampini 1820ad16ce7aSStefano Zampini .seealso: MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead(), MatDenseGetLDA() 1821ad16ce7aSStefano Zampini @*/ 1822ad16ce7aSStefano Zampini PetscErrorCode MatDenseSetLDA(Mat A,PetscInt lda) 1823ad16ce7aSStefano Zampini { 1824ad16ce7aSStefano Zampini PetscErrorCode ierr; 1825ad16ce7aSStefano Zampini 1826ad16ce7aSStefano Zampini PetscFunctionBegin; 1827ad16ce7aSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1828ad16ce7aSStefano Zampini ierr = PetscTryMethod(A,"MatDenseSetLDA_C",(Mat,PetscInt),(A,lda));CHKERRQ(ierr); 1829ad16ce7aSStefano Zampini PetscFunctionReturn(0); 1830ad16ce7aSStefano Zampini } 1831ad16ce7aSStefano Zampini 1832ad16ce7aSStefano Zampini /*@C 18336947451fSStefano Zampini MatDenseGetArray - gives read-write access to the array where the data for a dense matrix is stored 183473a71a0fSBarry Smith 18358572280aSBarry Smith Logically Collective on Mat 183673a71a0fSBarry Smith 183773a71a0fSBarry Smith Input Parameter: 18386947451fSStefano Zampini . mat - a dense matrix 183973a71a0fSBarry Smith 184073a71a0fSBarry Smith Output Parameter: 184173a71a0fSBarry Smith . array - pointer to the data 184273a71a0fSBarry Smith 184373a71a0fSBarry Smith Level: intermediate 184473a71a0fSBarry Smith 18456947451fSStefano Zampini .seealso: MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead(), MatDenseGetArrayWrite(), MatDenseRestoreArrayWrite() 184673a71a0fSBarry Smith @*/ 18478c778c55SBarry Smith PetscErrorCode MatDenseGetArray(Mat A,PetscScalar **array) 184873a71a0fSBarry Smith { 184973a71a0fSBarry Smith PetscErrorCode ierr; 185073a71a0fSBarry Smith 185173a71a0fSBarry Smith PetscFunctionBegin; 1852d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1853d5ea218eSStefano Zampini PetscValidPointer(array,2); 18548c778c55SBarry Smith ierr = PetscUseMethod(A,"MatDenseGetArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 185573a71a0fSBarry Smith PetscFunctionReturn(0); 185673a71a0fSBarry Smith } 185773a71a0fSBarry Smith 1858dec5eb66SMatthew G Knepley /*@C 1859579dbff0SBarry Smith MatDenseRestoreArray - returns access to the array where the data for a dense matrix is stored obtained by MatDenseGetArray() 186073a71a0fSBarry Smith 18618572280aSBarry Smith Logically Collective on Mat 18628572280aSBarry Smith 18638572280aSBarry Smith Input Parameters: 18646947451fSStefano Zampini + mat - a dense matrix 1865a2b725a8SWilliam Gropp - array - pointer to the data 18668572280aSBarry Smith 18678572280aSBarry Smith Level: intermediate 18688572280aSBarry Smith 18696947451fSStefano Zampini .seealso: MatDenseGetArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead(), MatDenseGetArrayWrite(), MatDenseRestoreArrayWrite() 18708572280aSBarry Smith @*/ 18718572280aSBarry Smith PetscErrorCode MatDenseRestoreArray(Mat A,PetscScalar **array) 18728572280aSBarry Smith { 18738572280aSBarry Smith PetscErrorCode ierr; 18748572280aSBarry Smith 18758572280aSBarry Smith PetscFunctionBegin; 1876d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1877d5ea218eSStefano Zampini PetscValidPointer(array,2); 18788572280aSBarry Smith ierr = PetscUseMethod(A,"MatDenseRestoreArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 18798572280aSBarry Smith ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr); 1880637a0070SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1881637a0070SStefano Zampini A->offloadmask = PETSC_OFFLOAD_CPU; 1882637a0070SStefano Zampini #endif 18838572280aSBarry Smith PetscFunctionReturn(0); 18848572280aSBarry Smith } 18858572280aSBarry Smith 18868572280aSBarry Smith /*@C 18876947451fSStefano Zampini MatDenseGetArrayRead - gives read-only access to the array where the data for a dense matrix is stored 18888572280aSBarry Smith 18898572280aSBarry Smith Not Collective 18908572280aSBarry Smith 18918572280aSBarry Smith Input Parameter: 18926947451fSStefano Zampini . mat - a dense matrix 18938572280aSBarry Smith 18948572280aSBarry Smith Output Parameter: 18958572280aSBarry Smith . array - pointer to the data 18968572280aSBarry Smith 18978572280aSBarry Smith Level: intermediate 18988572280aSBarry Smith 18996947451fSStefano Zampini .seealso: MatDenseRestoreArrayRead(), MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayWrite(), MatDenseRestoreArrayWrite() 19008572280aSBarry Smith @*/ 19018572280aSBarry Smith PetscErrorCode MatDenseGetArrayRead(Mat A,const PetscScalar **array) 19028572280aSBarry Smith { 19038572280aSBarry Smith PetscErrorCode ierr; 19048572280aSBarry Smith 19058572280aSBarry Smith PetscFunctionBegin; 1906d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1907d5ea218eSStefano Zampini PetscValidPointer(array,2); 19088572280aSBarry Smith ierr = PetscUseMethod(A,"MatDenseGetArrayRead_C",(Mat,const PetscScalar**),(A,array));CHKERRQ(ierr); 19098572280aSBarry Smith PetscFunctionReturn(0); 19108572280aSBarry Smith } 19118572280aSBarry Smith 19128572280aSBarry Smith /*@C 19136947451fSStefano Zampini MatDenseRestoreArrayRead - returns access to the array where the data for a dense matrix is stored obtained by MatDenseGetArrayRead() 19148572280aSBarry Smith 191573a71a0fSBarry Smith Not Collective 191673a71a0fSBarry Smith 191773a71a0fSBarry Smith Input Parameters: 19186947451fSStefano Zampini + mat - a dense matrix 1919a2b725a8SWilliam Gropp - array - pointer to the data 192073a71a0fSBarry Smith 192173a71a0fSBarry Smith Level: intermediate 192273a71a0fSBarry Smith 19236947451fSStefano Zampini .seealso: MatDenseGetArrayRead(), MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayWrite(), MatDenseRestoreArrayWrite() 192473a71a0fSBarry Smith @*/ 19258572280aSBarry Smith PetscErrorCode MatDenseRestoreArrayRead(Mat A,const PetscScalar **array) 192673a71a0fSBarry Smith { 192773a71a0fSBarry Smith PetscErrorCode ierr; 192873a71a0fSBarry Smith 192973a71a0fSBarry Smith PetscFunctionBegin; 1930d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1931d5ea218eSStefano Zampini PetscValidPointer(array,2); 19328572280aSBarry Smith ierr = PetscUseMethod(A,"MatDenseRestoreArrayRead_C",(Mat,const PetscScalar**),(A,array));CHKERRQ(ierr); 193373a71a0fSBarry Smith PetscFunctionReturn(0); 193473a71a0fSBarry Smith } 193573a71a0fSBarry Smith 19366947451fSStefano Zampini /*@C 19376947451fSStefano Zampini MatDenseGetArrayWrite - gives write-only access to the array where the data for a dense matrix is stored 19386947451fSStefano Zampini 19396947451fSStefano Zampini Not Collective 19406947451fSStefano Zampini 19416947451fSStefano Zampini Input Parameter: 19426947451fSStefano Zampini . mat - a dense matrix 19436947451fSStefano Zampini 19446947451fSStefano Zampini Output Parameter: 19456947451fSStefano Zampini . array - pointer to the data 19466947451fSStefano Zampini 19476947451fSStefano Zampini Level: intermediate 19486947451fSStefano Zampini 19496947451fSStefano Zampini .seealso: MatDenseRestoreArrayWrite(), MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead() 19506947451fSStefano Zampini @*/ 19516947451fSStefano Zampini PetscErrorCode MatDenseGetArrayWrite(Mat A,PetscScalar **array) 19526947451fSStefano Zampini { 19536947451fSStefano Zampini PetscErrorCode ierr; 19546947451fSStefano Zampini 19556947451fSStefano Zampini PetscFunctionBegin; 1956d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1957d5ea218eSStefano Zampini PetscValidPointer(array,2); 19586947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseGetArrayWrite_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 19596947451fSStefano Zampini PetscFunctionReturn(0); 19606947451fSStefano Zampini } 19616947451fSStefano Zampini 19626947451fSStefano Zampini /*@C 19636947451fSStefano Zampini MatDenseRestoreArrayWrite - returns access to the array where the data for a dense matrix is stored obtained by MatDenseGetArrayWrite() 19646947451fSStefano Zampini 19656947451fSStefano Zampini Not Collective 19666947451fSStefano Zampini 19676947451fSStefano Zampini Input Parameters: 19686947451fSStefano Zampini + mat - a dense matrix 19696947451fSStefano Zampini - array - pointer to the data 19706947451fSStefano Zampini 19716947451fSStefano Zampini Level: intermediate 19726947451fSStefano Zampini 19736947451fSStefano Zampini .seealso: MatDenseGetArrayWrite(), MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead() 19746947451fSStefano Zampini @*/ 19756947451fSStefano Zampini PetscErrorCode MatDenseRestoreArrayWrite(Mat A,PetscScalar **array) 19766947451fSStefano Zampini { 19776947451fSStefano Zampini PetscErrorCode ierr; 19786947451fSStefano Zampini 19796947451fSStefano Zampini PetscFunctionBegin; 1980d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1981d5ea218eSStefano Zampini PetscValidPointer(array,2); 19826947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseRestoreArrayWrite_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 19836947451fSStefano Zampini ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr); 19846947451fSStefano Zampini #if defined(PETSC_HAVE_CUDA) 19856947451fSStefano Zampini A->offloadmask = PETSC_OFFLOAD_CPU; 19866947451fSStefano Zampini #endif 19876947451fSStefano Zampini PetscFunctionReturn(0); 19886947451fSStefano Zampini } 19896947451fSStefano Zampini 19907dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrix_SeqDense(Mat A,IS isrow,IS iscol,PetscInt cs,MatReuse scall,Mat *B) 19910754003eSLois Curfman McInnes { 1992c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 19936849ba73SBarry Smith PetscErrorCode ierr; 1994ca15aa20SStefano Zampini PetscInt i,j,nrows,ncols,blda; 19955d0c19d7SBarry Smith const PetscInt *irow,*icol; 199687828ca2SBarry Smith PetscScalar *av,*bv,*v = mat->v; 19970754003eSLois Curfman McInnes Mat newmat; 19980754003eSLois Curfman McInnes 19993a40ed3dSBarry Smith PetscFunctionBegin; 200078b31e54SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 200178b31e54SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 2002e03a110bSBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 2003e03a110bSBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 20040754003eSLois Curfman McInnes 2005182d2002SSatish Balay /* Check submatrixcall */ 2006182d2002SSatish Balay if (scall == MAT_REUSE_MATRIX) { 200713f74950SBarry Smith PetscInt n_cols,n_rows; 2008182d2002SSatish Balay ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 200921a2c019SBarry Smith if (n_rows != nrows || n_cols != ncols) { 2010f746d493SDmitry Karpeev /* resize the result matrix to match number of requested rows/columns */ 2011c61587bbSBarry Smith ierr = MatSetSizes(*B,nrows,ncols,nrows,ncols);CHKERRQ(ierr); 201221a2c019SBarry Smith } 2013182d2002SSatish Balay newmat = *B; 2014182d2002SSatish Balay } else { 20150754003eSLois Curfman McInnes /* Create and fill new matrix */ 2016ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&newmat);CHKERRQ(ierr); 2017f69a0ea3SMatthew Knepley ierr = MatSetSizes(newmat,nrows,ncols,nrows,ncols);CHKERRQ(ierr); 20187adad957SLisandro Dalcin ierr = MatSetType(newmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 20190298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(newmat,NULL);CHKERRQ(ierr); 2020182d2002SSatish Balay } 2021182d2002SSatish Balay 2022182d2002SSatish Balay /* Now extract the data pointers and do the copy,column at a time */ 2023ca15aa20SStefano Zampini ierr = MatDenseGetArray(newmat,&bv);CHKERRQ(ierr); 2024ca15aa20SStefano Zampini ierr = MatDenseGetLDA(newmat,&blda);CHKERRQ(ierr); 2025182d2002SSatish Balay for (i=0; i<ncols; i++) { 20266de62eeeSBarry Smith av = v + mat->lda*icol[i]; 2027ca15aa20SStefano Zampini for (j=0; j<nrows; j++) bv[j] = av[irow[j]]; 2028ca15aa20SStefano Zampini bv += blda; 20290754003eSLois Curfman McInnes } 2030ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(newmat,&bv);CHKERRQ(ierr); 2031182d2002SSatish Balay 2032182d2002SSatish Balay /* Assemble the matrices so that the correct flags are set */ 20336d4a8577SBarry Smith ierr = MatAssemblyBegin(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20346d4a8577SBarry Smith ierr = MatAssemblyEnd(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20350754003eSLois Curfman McInnes 20360754003eSLois Curfman McInnes /* Free work space */ 203778b31e54SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 203878b31e54SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 2039182d2002SSatish Balay *B = newmat; 20403a40ed3dSBarry Smith PetscFunctionReturn(0); 20410754003eSLois Curfman McInnes } 20420754003eSLois Curfman McInnes 20437dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrices_SeqDense(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2044905e6a2fSBarry Smith { 20456849ba73SBarry Smith PetscErrorCode ierr; 204613f74950SBarry Smith PetscInt i; 2047905e6a2fSBarry Smith 20483a40ed3dSBarry Smith PetscFunctionBegin; 2049905e6a2fSBarry Smith if (scall == MAT_INITIAL_MATRIX) { 2050df750dc8SHong Zhang ierr = PetscCalloc1(n+1,B);CHKERRQ(ierr); 2051905e6a2fSBarry Smith } 2052905e6a2fSBarry Smith 2053905e6a2fSBarry Smith for (i=0; i<n; i++) { 20547dae84e0SHong Zhang ierr = MatCreateSubMatrix_SeqDense(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 2055905e6a2fSBarry Smith } 20563a40ed3dSBarry Smith PetscFunctionReturn(0); 2057905e6a2fSBarry Smith } 2058905e6a2fSBarry Smith 2059e0877f53SBarry Smith static PetscErrorCode MatAssemblyBegin_SeqDense(Mat mat,MatAssemblyType mode) 2060c0aa2d19SHong Zhang { 2061c0aa2d19SHong Zhang PetscFunctionBegin; 2062c0aa2d19SHong Zhang PetscFunctionReturn(0); 2063c0aa2d19SHong Zhang } 2064c0aa2d19SHong Zhang 2065e0877f53SBarry Smith static PetscErrorCode MatAssemblyEnd_SeqDense(Mat mat,MatAssemblyType mode) 2066c0aa2d19SHong Zhang { 2067c0aa2d19SHong Zhang PetscFunctionBegin; 2068c0aa2d19SHong Zhang PetscFunctionReturn(0); 2069c0aa2d19SHong Zhang } 2070c0aa2d19SHong Zhang 2071e0877f53SBarry Smith static PetscErrorCode MatCopy_SeqDense(Mat A,Mat B,MatStructure str) 20724b0e389bSBarry Smith { 20734b0e389bSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data,*b = (Mat_SeqDense*)B->data; 20746849ba73SBarry Smith PetscErrorCode ierr; 2075ca15aa20SStefano Zampini const PetscScalar *va; 2076ca15aa20SStefano Zampini PetscScalar *vb; 2077d0f46423SBarry Smith PetscInt lda1=a->lda,lda2=b->lda, m=A->rmap->n,n=A->cmap->n, j; 20783a40ed3dSBarry Smith 20793a40ed3dSBarry Smith PetscFunctionBegin; 208033f4a19fSKris Buschelman /* If the two matrices don't have the same copy implementation, they aren't compatible for fast copy. */ 208133f4a19fSKris Buschelman if (A->ops->copy != B->ops->copy) { 2082cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 20833a40ed3dSBarry Smith PetscFunctionReturn(0); 20843a40ed3dSBarry Smith } 2085e32f2f54SBarry Smith if (m != B->rmap->n || n != B->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"size(B) != size(A)"); 2086ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&va);CHKERRQ(ierr); 2087ca15aa20SStefano Zampini ierr = MatDenseGetArray(B,&vb);CHKERRQ(ierr); 2088a5ce6ee0Svictorle if (lda1>m || lda2>m) { 20890dbb7854Svictorle for (j=0; j<n; j++) { 2090ca15aa20SStefano Zampini ierr = PetscArraycpy(vb+j*lda2,va+j*lda1,m);CHKERRQ(ierr); 2091a5ce6ee0Svictorle } 2092a5ce6ee0Svictorle } else { 2093ca15aa20SStefano Zampini ierr = PetscArraycpy(vb,va,A->rmap->n*A->cmap->n);CHKERRQ(ierr); 2094a5ce6ee0Svictorle } 2095ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(B,&vb);CHKERRQ(ierr); 2096ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&va);CHKERRQ(ierr); 2097ca15aa20SStefano Zampini ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2098ca15aa20SStefano Zampini ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2099273d9f13SBarry Smith PetscFunctionReturn(0); 2100273d9f13SBarry Smith } 2101273d9f13SBarry Smith 2102e0877f53SBarry Smith static PetscErrorCode MatSetUp_SeqDense(Mat A) 2103273d9f13SBarry Smith { 2104dfbe8321SBarry Smith PetscErrorCode ierr; 2105273d9f13SBarry Smith 2106273d9f13SBarry Smith PetscFunctionBegin; 210718992e5dSStefano Zampini ierr = PetscLayoutSetUp(A->rmap);CHKERRQ(ierr); 210818992e5dSStefano Zampini ierr = PetscLayoutSetUp(A->cmap);CHKERRQ(ierr); 210918992e5dSStefano Zampini if (!A->preallocated) { 2110273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(A,0);CHKERRQ(ierr); 211118992e5dSStefano Zampini } 21123a40ed3dSBarry Smith PetscFunctionReturn(0); 21134b0e389bSBarry Smith } 21144b0e389bSBarry Smith 2115ba337c44SJed Brown static PetscErrorCode MatConjugate_SeqDense(Mat A) 2116ba337c44SJed Brown { 2117ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 2118ca15aa20SStefano Zampini PetscScalar *aa; 2119ca15aa20SStefano Zampini PetscErrorCode ierr; 2120ba337c44SJed Brown 2121ba337c44SJed Brown PetscFunctionBegin; 2122ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&aa);CHKERRQ(ierr); 2123ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscConj(aa[i]); 2124ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&aa);CHKERRQ(ierr); 2125ba337c44SJed Brown PetscFunctionReturn(0); 2126ba337c44SJed Brown } 2127ba337c44SJed Brown 2128ba337c44SJed Brown static PetscErrorCode MatRealPart_SeqDense(Mat A) 2129ba337c44SJed Brown { 2130ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 2131ca15aa20SStefano Zampini PetscScalar *aa; 2132ca15aa20SStefano Zampini PetscErrorCode ierr; 2133ba337c44SJed Brown 2134ba337c44SJed Brown PetscFunctionBegin; 2135ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&aa);CHKERRQ(ierr); 2136ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 2137ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&aa);CHKERRQ(ierr); 2138ba337c44SJed Brown PetscFunctionReturn(0); 2139ba337c44SJed Brown } 2140ba337c44SJed Brown 2141ba337c44SJed Brown static PetscErrorCode MatImaginaryPart_SeqDense(Mat A) 2142ba337c44SJed Brown { 2143ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 2144ca15aa20SStefano Zampini PetscScalar *aa; 2145ca15aa20SStefano Zampini PetscErrorCode ierr; 2146ba337c44SJed Brown 2147ba337c44SJed Brown PetscFunctionBegin; 2148ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&aa);CHKERRQ(ierr); 2149ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 2150ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&aa);CHKERRQ(ierr); 2151ba337c44SJed Brown PetscFunctionReturn(0); 2152ba337c44SJed Brown } 2153284134d9SBarry Smith 2154a9fe9ddaSSatish Balay /* ----------------------------------------------------------------*/ 21554222ddf1SHong Zhang PetscErrorCode MatMatMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat C) 2156a9fe9ddaSSatish Balay { 2157ee16a9a1SHong Zhang PetscErrorCode ierr; 2158d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 21597a3c3d58SStefano Zampini PetscBool cisdense; 2160a9fe9ddaSSatish Balay 2161ee16a9a1SHong Zhang PetscFunctionBegin; 21624222ddf1SHong Zhang ierr = MatSetSizes(C,m,n,m,n);CHKERRQ(ierr); 21637a3c3d58SStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 21647a3c3d58SStefano Zampini if (!cisdense) { 21657a3c3d58SStefano Zampini PetscBool flg; 21667a3c3d58SStefano Zampini 2167ca15aa20SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)B,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 21684222ddf1SHong Zhang ierr = MatSetType(C,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 21697a3c3d58SStefano Zampini } 217018992e5dSStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 2171ee16a9a1SHong Zhang PetscFunctionReturn(0); 2172ee16a9a1SHong Zhang } 2173a9fe9ddaSSatish Balay 2174a9fe9ddaSSatish Balay PetscErrorCode MatMatMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 2175a9fe9ddaSSatish Balay { 2176*6718818eSStefano Zampini Mat_SeqDense *a=(Mat_SeqDense*)A->data,*b=(Mat_SeqDense*)B->data,*c=(Mat_SeqDense*)C->data; 21770805154bSBarry Smith PetscBLASInt m,n,k; 2178ca15aa20SStefano Zampini const PetscScalar *av,*bv; 2179ca15aa20SStefano Zampini PetscScalar *cv; 2180a9fe9ddaSSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 2181c2916339SPierre Jolivet PetscErrorCode ierr; 2182a9fe9ddaSSatish Balay 2183a9fe9ddaSSatish Balay PetscFunctionBegin; 21848208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->rmap->n,&m);CHKERRQ(ierr); 21858208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->cmap->n,&n);CHKERRQ(ierr); 2186c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&k);CHKERRQ(ierr); 218749d0e964SStefano Zampini if (!m || !n || !k) PetscFunctionReturn(0); 2188ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&av);CHKERRQ(ierr); 2189ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(B,&bv);CHKERRQ(ierr); 2190*6718818eSStefano Zampini ierr = MatDenseGetArrayWrite(C,&cv);CHKERRQ(ierr); 2191ca15aa20SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("N","N",&m,&n,&k,&_DOne,av,&a->lda,bv,&b->lda,&_DZero,cv,&c->lda)); 2192ca15aa20SStefano Zampini ierr = PetscLogFlops(1.0*m*n*k + 1.0*m*n*(k-1));CHKERRQ(ierr); 2193ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&av);CHKERRQ(ierr); 2194ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(B,&bv);CHKERRQ(ierr); 2195*6718818eSStefano Zampini ierr = MatDenseRestoreArrayWrite(C,&cv);CHKERRQ(ierr); 2196a9fe9ddaSSatish Balay PetscFunctionReturn(0); 2197a9fe9ddaSSatish Balay } 2198a9fe9ddaSSatish Balay 21994222ddf1SHong Zhang PetscErrorCode MatMatTransposeMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat C) 220069f65d41SStefano Zampini { 220169f65d41SStefano Zampini PetscErrorCode ierr; 220269f65d41SStefano Zampini PetscInt m=A->rmap->n,n=B->rmap->n; 22037a3c3d58SStefano Zampini PetscBool cisdense; 220469f65d41SStefano Zampini 220569f65d41SStefano Zampini PetscFunctionBegin; 22064222ddf1SHong Zhang ierr = MatSetSizes(C,m,n,m,n);CHKERRQ(ierr); 22077a3c3d58SStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 22087a3c3d58SStefano Zampini if (!cisdense) { 22097a3c3d58SStefano Zampini PetscBool flg; 22107a3c3d58SStefano Zampini 2211ca15aa20SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)B,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 22124222ddf1SHong Zhang ierr = MatSetType(C,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 22137a3c3d58SStefano Zampini } 221418992e5dSStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 221569f65d41SStefano Zampini PetscFunctionReturn(0); 221669f65d41SStefano Zampini } 221769f65d41SStefano Zampini 221869f65d41SStefano Zampini PetscErrorCode MatMatTransposeMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 221969f65d41SStefano Zampini { 222069f65d41SStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 222169f65d41SStefano Zampini Mat_SeqDense *b = (Mat_SeqDense*)B->data; 222269f65d41SStefano Zampini Mat_SeqDense *c = (Mat_SeqDense*)C->data; 2223*6718818eSStefano Zampini const PetscScalar *av,*bv; 2224*6718818eSStefano Zampini PetscScalar *cv; 222569f65d41SStefano Zampini PetscBLASInt m,n,k; 222669f65d41SStefano Zampini PetscScalar _DOne=1.0,_DZero=0.0; 222769f65d41SStefano Zampini PetscErrorCode ierr; 222869f65d41SStefano Zampini 222969f65d41SStefano Zampini PetscFunctionBegin; 223049d0e964SStefano Zampini ierr = PetscBLASIntCast(C->rmap->n,&m);CHKERRQ(ierr); 223149d0e964SStefano Zampini ierr = PetscBLASIntCast(C->cmap->n,&n);CHKERRQ(ierr); 223269f65d41SStefano Zampini ierr = PetscBLASIntCast(A->cmap->n,&k);CHKERRQ(ierr); 223349d0e964SStefano Zampini if (!m || !n || !k) PetscFunctionReturn(0); 2234*6718818eSStefano Zampini ierr = MatDenseGetArrayRead(A,&av);CHKERRQ(ierr); 2235*6718818eSStefano Zampini ierr = MatDenseGetArrayRead(B,&bv);CHKERRQ(ierr); 2236*6718818eSStefano Zampini ierr = MatDenseGetArrayWrite(C,&cv);CHKERRQ(ierr); 2237*6718818eSStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("N","T",&m,&n,&k,&_DOne,av,&a->lda,bv,&b->lda,&_DZero,cv,&c->lda)); 2238*6718818eSStefano Zampini ierr = MatDenseRestoreArrayRead(A,&av);CHKERRQ(ierr); 2239*6718818eSStefano Zampini ierr = MatDenseRestoreArrayRead(B,&bv);CHKERRQ(ierr); 2240*6718818eSStefano Zampini ierr = MatDenseRestoreArrayWrite(C,&cv);CHKERRQ(ierr); 2241ca15aa20SStefano Zampini ierr = PetscLogFlops(1.0*m*n*k + 1.0*m*n*(k-1));CHKERRQ(ierr); 224269f65d41SStefano Zampini PetscFunctionReturn(0); 224369f65d41SStefano Zampini } 224469f65d41SStefano Zampini 22454222ddf1SHong Zhang PetscErrorCode MatTransposeMatMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat C) 2246a9fe9ddaSSatish Balay { 2247ee16a9a1SHong Zhang PetscErrorCode ierr; 2248d0f46423SBarry Smith PetscInt m=A->cmap->n,n=B->cmap->n; 22497a3c3d58SStefano Zampini PetscBool cisdense; 2250a9fe9ddaSSatish Balay 2251ee16a9a1SHong Zhang PetscFunctionBegin; 22524222ddf1SHong Zhang ierr = MatSetSizes(C,m,n,m,n);CHKERRQ(ierr); 22537a3c3d58SStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 22547a3c3d58SStefano Zampini if (!cisdense) { 22557a3c3d58SStefano Zampini PetscBool flg; 22567a3c3d58SStefano Zampini 2257ca15aa20SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)B,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 22584222ddf1SHong Zhang ierr = MatSetType(C,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 22597a3c3d58SStefano Zampini } 226018992e5dSStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 2261ee16a9a1SHong Zhang PetscFunctionReturn(0); 2262ee16a9a1SHong Zhang } 2263a9fe9ddaSSatish Balay 226475648e8dSHong Zhang PetscErrorCode MatTransposeMatMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 2265a9fe9ddaSSatish Balay { 2266a9fe9ddaSSatish Balay Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2267a9fe9ddaSSatish Balay Mat_SeqDense *b = (Mat_SeqDense*)B->data; 2268a9fe9ddaSSatish Balay Mat_SeqDense *c = (Mat_SeqDense*)C->data; 2269*6718818eSStefano Zampini const PetscScalar *av,*bv; 2270*6718818eSStefano Zampini PetscScalar *cv; 22710805154bSBarry Smith PetscBLASInt m,n,k; 2272a9fe9ddaSSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 2273c5df96a5SBarry Smith PetscErrorCode ierr; 2274a9fe9ddaSSatish Balay 2275a9fe9ddaSSatish Balay PetscFunctionBegin; 22768208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->rmap->n,&m);CHKERRQ(ierr); 22778208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->cmap->n,&n);CHKERRQ(ierr); 2278c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&k);CHKERRQ(ierr); 227949d0e964SStefano Zampini if (!m || !n || !k) PetscFunctionReturn(0); 2280*6718818eSStefano Zampini ierr = MatDenseGetArrayRead(A,&av);CHKERRQ(ierr); 2281*6718818eSStefano Zampini ierr = MatDenseGetArrayRead(B,&bv);CHKERRQ(ierr); 2282*6718818eSStefano Zampini ierr = MatDenseGetArrayWrite(C,&cv);CHKERRQ(ierr); 2283*6718818eSStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("T","N",&m,&n,&k,&_DOne,av,&a->lda,bv,&b->lda,&_DZero,cv,&c->lda)); 2284*6718818eSStefano Zampini ierr = MatDenseRestoreArrayRead(A,&av);CHKERRQ(ierr); 2285*6718818eSStefano Zampini ierr = MatDenseRestoreArrayRead(B,&bv);CHKERRQ(ierr); 2286*6718818eSStefano Zampini ierr = MatDenseRestoreArrayWrite(C,&cv);CHKERRQ(ierr); 2287ca15aa20SStefano Zampini ierr = PetscLogFlops(1.0*m*n*k + 1.0*m*n*(k-1));CHKERRQ(ierr); 2288a9fe9ddaSSatish Balay PetscFunctionReturn(0); 2289a9fe9ddaSSatish Balay } 2290985db425SBarry Smith 22914222ddf1SHong Zhang /* ----------------------------------------------- */ 22924222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_SeqDense_AB(Mat C) 22934222ddf1SHong Zhang { 22944222ddf1SHong Zhang PetscFunctionBegin; 22954222ddf1SHong Zhang C->ops->matmultsymbolic = MatMatMultSymbolic_SeqDense_SeqDense; 22964222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_AB; 22974222ddf1SHong Zhang PetscFunctionReturn(0); 22984222ddf1SHong Zhang } 22994222ddf1SHong Zhang 23004222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_SeqDense_AtB(Mat C) 23014222ddf1SHong Zhang { 23024222ddf1SHong Zhang PetscFunctionBegin; 23034222ddf1SHong Zhang C->ops->transposematmultsymbolic = MatTransposeMatMultSymbolic_SeqDense_SeqDense; 23044222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_AtB; 23054222ddf1SHong Zhang PetscFunctionReturn(0); 23064222ddf1SHong Zhang } 23074222ddf1SHong Zhang 23084222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_SeqDense_ABt(Mat C) 23094222ddf1SHong Zhang { 23104222ddf1SHong Zhang PetscFunctionBegin; 23114222ddf1SHong Zhang C->ops->mattransposemultsymbolic = MatMatTransposeMultSymbolic_SeqDense_SeqDense; 23124222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_ABt; 23134222ddf1SHong Zhang PetscFunctionReturn(0); 23144222ddf1SHong Zhang } 23154222ddf1SHong Zhang 23164222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_SeqDense(Mat C) 23174222ddf1SHong Zhang { 23184222ddf1SHong Zhang PetscErrorCode ierr; 23194222ddf1SHong Zhang Mat_Product *product = C->product; 23204222ddf1SHong Zhang 23214222ddf1SHong Zhang PetscFunctionBegin; 23224222ddf1SHong Zhang switch (product->type) { 23234222ddf1SHong Zhang case MATPRODUCT_AB: 23244222ddf1SHong Zhang ierr = MatProductSetFromOptions_SeqDense_AB(C);CHKERRQ(ierr); 23254222ddf1SHong Zhang break; 23264222ddf1SHong Zhang case MATPRODUCT_AtB: 23274222ddf1SHong Zhang ierr = MatProductSetFromOptions_SeqDense_AtB(C);CHKERRQ(ierr); 23284222ddf1SHong Zhang break; 23294222ddf1SHong Zhang case MATPRODUCT_ABt: 23304222ddf1SHong Zhang ierr = MatProductSetFromOptions_SeqDense_ABt(C);CHKERRQ(ierr); 23314222ddf1SHong Zhang break; 2332*6718818eSStefano Zampini default: 23334222ddf1SHong Zhang break; 23344222ddf1SHong Zhang } 23354222ddf1SHong Zhang PetscFunctionReturn(0); 23364222ddf1SHong Zhang } 23374222ddf1SHong Zhang /* ----------------------------------------------- */ 23384222ddf1SHong Zhang 2339e0877f53SBarry Smith static PetscErrorCode MatGetRowMax_SeqDense(Mat A,Vec v,PetscInt idx[]) 2340985db425SBarry Smith { 2341985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2342985db425SBarry Smith PetscErrorCode ierr; 2343d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 2344985db425SBarry Smith PetscScalar *x; 2345ca15aa20SStefano Zampini const PetscScalar *aa; 2346985db425SBarry Smith 2347985db425SBarry Smith PetscFunctionBegin; 2348e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2349985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2350985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 2351ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 2352e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2353985db425SBarry Smith for (i=0; i<m; i++) { 2354985db425SBarry Smith x[i] = aa[i]; if (idx) idx[i] = 0; 2355985db425SBarry Smith for (j=1; j<n; j++) { 2356ca15aa20SStefano Zampini if (PetscRealPart(x[i]) < PetscRealPart(aa[i+a->lda*j])) {x[i] = aa[i + a->lda*j]; if (idx) idx[i] = j;} 2357985db425SBarry Smith } 2358985db425SBarry Smith } 2359ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 2360985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2361985db425SBarry Smith PetscFunctionReturn(0); 2362985db425SBarry Smith } 2363985db425SBarry Smith 2364e0877f53SBarry Smith static PetscErrorCode MatGetRowMaxAbs_SeqDense(Mat A,Vec v,PetscInt idx[]) 2365985db425SBarry Smith { 2366985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2367985db425SBarry Smith PetscErrorCode ierr; 2368d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 2369985db425SBarry Smith PetscScalar *x; 2370985db425SBarry Smith PetscReal atmp; 2371ca15aa20SStefano Zampini const PetscScalar *aa; 2372985db425SBarry Smith 2373985db425SBarry Smith PetscFunctionBegin; 2374e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2375985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2376985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 2377ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 2378e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2379985db425SBarry Smith for (i=0; i<m; i++) { 23809189402eSHong Zhang x[i] = PetscAbsScalar(aa[i]); 2381985db425SBarry Smith for (j=1; j<n; j++) { 2382ca15aa20SStefano Zampini atmp = PetscAbsScalar(aa[i+a->lda*j]); 2383985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = j;} 2384985db425SBarry Smith } 2385985db425SBarry Smith } 2386ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 2387985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2388985db425SBarry Smith PetscFunctionReturn(0); 2389985db425SBarry Smith } 2390985db425SBarry Smith 2391e0877f53SBarry Smith static PetscErrorCode MatGetRowMin_SeqDense(Mat A,Vec v,PetscInt idx[]) 2392985db425SBarry Smith { 2393985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2394985db425SBarry Smith PetscErrorCode ierr; 2395d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 2396985db425SBarry Smith PetscScalar *x; 2397ca15aa20SStefano Zampini const PetscScalar *aa; 2398985db425SBarry Smith 2399985db425SBarry Smith PetscFunctionBegin; 2400e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2401ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 2402985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2403985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 2404e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2405985db425SBarry Smith for (i=0; i<m; i++) { 2406985db425SBarry Smith x[i] = aa[i]; if (idx) idx[i] = 0; 2407985db425SBarry Smith for (j=1; j<n; j++) { 2408ca15aa20SStefano Zampini if (PetscRealPart(x[i]) > PetscRealPart(aa[i+a->lda*j])) {x[i] = aa[i + a->lda*j]; if (idx) idx[i] = j;} 2409985db425SBarry Smith } 2410985db425SBarry Smith } 2411985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2412ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 2413985db425SBarry Smith PetscFunctionReturn(0); 2414985db425SBarry Smith } 2415985db425SBarry Smith 2416637a0070SStefano Zampini PetscErrorCode MatGetColumnVector_SeqDense(Mat A,Vec v,PetscInt col) 24178d0534beSBarry Smith { 24188d0534beSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 24198d0534beSBarry Smith PetscErrorCode ierr; 24208d0534beSBarry Smith PetscScalar *x; 2421ca15aa20SStefano Zampini const PetscScalar *aa; 24228d0534beSBarry Smith 24238d0534beSBarry Smith PetscFunctionBegin; 2424e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2425ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 24268d0534beSBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2427ca15aa20SStefano Zampini ierr = PetscArraycpy(x,aa+col*a->lda,A->rmap->n);CHKERRQ(ierr); 24288d0534beSBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2429ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 24308d0534beSBarry Smith PetscFunctionReturn(0); 24318d0534beSBarry Smith } 24328d0534beSBarry Smith 243352c5f739Sprj- PETSC_INTERN PetscErrorCode MatGetColumnNorms_SeqDense(Mat A,NormType type,PetscReal *norms) 24340716a85fSBarry Smith { 24350716a85fSBarry Smith PetscErrorCode ierr; 24360716a85fSBarry Smith PetscInt i,j,m,n; 24371683a169SBarry Smith const PetscScalar *a; 24380716a85fSBarry Smith 24390716a85fSBarry Smith PetscFunctionBegin; 24400716a85fSBarry Smith ierr = MatGetSize(A,&m,&n);CHKERRQ(ierr); 2441580bdb30SBarry Smith ierr = PetscArrayzero(norms,n);CHKERRQ(ierr); 24421683a169SBarry Smith ierr = MatDenseGetArrayRead(A,&a);CHKERRQ(ierr); 24430716a85fSBarry Smith if (type == NORM_2) { 24440716a85fSBarry Smith for (i=0; i<n; i++) { 24450716a85fSBarry Smith for (j=0; j<m; j++) { 24460716a85fSBarry Smith norms[i] += PetscAbsScalar(a[j]*a[j]); 24470716a85fSBarry Smith } 24480716a85fSBarry Smith a += m; 24490716a85fSBarry Smith } 24500716a85fSBarry Smith } else if (type == NORM_1) { 24510716a85fSBarry Smith for (i=0; i<n; i++) { 24520716a85fSBarry Smith for (j=0; j<m; j++) { 24530716a85fSBarry Smith norms[i] += PetscAbsScalar(a[j]); 24540716a85fSBarry Smith } 24550716a85fSBarry Smith a += m; 24560716a85fSBarry Smith } 24570716a85fSBarry Smith } else if (type == NORM_INFINITY) { 24580716a85fSBarry Smith for (i=0; i<n; i++) { 24590716a85fSBarry Smith for (j=0; j<m; j++) { 24600716a85fSBarry Smith norms[i] = PetscMax(PetscAbsScalar(a[j]),norms[i]); 24610716a85fSBarry Smith } 24620716a85fSBarry Smith a += m; 24630716a85fSBarry Smith } 2464ce94432eSBarry Smith } else SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Unknown NormType"); 24651683a169SBarry Smith ierr = MatDenseRestoreArrayRead(A,&a);CHKERRQ(ierr); 24660716a85fSBarry Smith if (type == NORM_2) { 24678f1a2a5eSBarry Smith for (i=0; i<n; i++) norms[i] = PetscSqrtReal(norms[i]); 24680716a85fSBarry Smith } 24690716a85fSBarry Smith PetscFunctionReturn(0); 24700716a85fSBarry Smith } 24710716a85fSBarry Smith 247273a71a0fSBarry Smith static PetscErrorCode MatSetRandom_SeqDense(Mat x,PetscRandom rctx) 247373a71a0fSBarry Smith { 247473a71a0fSBarry Smith PetscErrorCode ierr; 247573a71a0fSBarry Smith PetscScalar *a; 2476637a0070SStefano Zampini PetscInt lda,m,n,i,j; 247773a71a0fSBarry Smith 247873a71a0fSBarry Smith PetscFunctionBegin; 247973a71a0fSBarry Smith ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr); 2480637a0070SStefano Zampini ierr = MatDenseGetLDA(x,&lda);CHKERRQ(ierr); 24818c778c55SBarry Smith ierr = MatDenseGetArray(x,&a);CHKERRQ(ierr); 2482637a0070SStefano Zampini for (j=0; j<n; j++) { 2483637a0070SStefano Zampini for (i=0; i<m; i++) { 2484637a0070SStefano Zampini ierr = PetscRandomGetValue(rctx,a+j*lda+i);CHKERRQ(ierr); 2485637a0070SStefano Zampini } 248673a71a0fSBarry Smith } 24878c778c55SBarry Smith ierr = MatDenseRestoreArray(x,&a);CHKERRQ(ierr); 248873a71a0fSBarry Smith PetscFunctionReturn(0); 248973a71a0fSBarry Smith } 249073a71a0fSBarry Smith 24913b49f96aSBarry Smith static PetscErrorCode MatMissingDiagonal_SeqDense(Mat A,PetscBool *missing,PetscInt *d) 24923b49f96aSBarry Smith { 24933b49f96aSBarry Smith PetscFunctionBegin; 24943b49f96aSBarry Smith *missing = PETSC_FALSE; 24953b49f96aSBarry Smith PetscFunctionReturn(0); 24963b49f96aSBarry Smith } 249773a71a0fSBarry Smith 2498ca15aa20SStefano Zampini /* vals is not const */ 2499af53bab2SHong Zhang static PetscErrorCode MatDenseGetColumn_SeqDense(Mat A,PetscInt col,PetscScalar **vals) 250086aefd0dSHong Zhang { 2501ca15aa20SStefano Zampini PetscErrorCode ierr; 250286aefd0dSHong Zhang Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2503ca15aa20SStefano Zampini PetscScalar *v; 250486aefd0dSHong Zhang 250586aefd0dSHong Zhang PetscFunctionBegin; 250686aefd0dSHong Zhang if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2507ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 2508ca15aa20SStefano Zampini *vals = v+col*a->lda; 2509ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 251086aefd0dSHong Zhang PetscFunctionReturn(0); 251186aefd0dSHong Zhang } 251286aefd0dSHong Zhang 2513af53bab2SHong Zhang static PetscErrorCode MatDenseRestoreColumn_SeqDense(Mat A,PetscScalar **vals) 251486aefd0dSHong Zhang { 251586aefd0dSHong Zhang PetscFunctionBegin; 251686aefd0dSHong Zhang *vals = 0; /* user cannot accidently use the array later */ 251786aefd0dSHong Zhang PetscFunctionReturn(0); 251886aefd0dSHong Zhang } 2519abc3b08eSStefano Zampini 2520289bc588SBarry Smith /* -------------------------------------------------------------------*/ 2521a5ae1ecdSBarry Smith static struct _MatOps MatOps_Values = { MatSetValues_SeqDense, 2522905e6a2fSBarry Smith MatGetRow_SeqDense, 2523905e6a2fSBarry Smith MatRestoreRow_SeqDense, 2524905e6a2fSBarry Smith MatMult_SeqDense, 252597304618SKris Buschelman /* 4*/ MatMultAdd_SeqDense, 25267c922b88SBarry Smith MatMultTranspose_SeqDense, 25277c922b88SBarry Smith MatMultTransposeAdd_SeqDense, 2528db4efbfdSBarry Smith 0, 2529db4efbfdSBarry Smith 0, 2530db4efbfdSBarry Smith 0, 2531db4efbfdSBarry Smith /* 10*/ 0, 2532905e6a2fSBarry Smith MatLUFactor_SeqDense, 2533905e6a2fSBarry Smith MatCholeskyFactor_SeqDense, 253441f059aeSBarry Smith MatSOR_SeqDense, 2535ec8511deSBarry Smith MatTranspose_SeqDense, 253697304618SKris Buschelman /* 15*/ MatGetInfo_SeqDense, 2537905e6a2fSBarry Smith MatEqual_SeqDense, 2538905e6a2fSBarry Smith MatGetDiagonal_SeqDense, 2539905e6a2fSBarry Smith MatDiagonalScale_SeqDense, 2540905e6a2fSBarry Smith MatNorm_SeqDense, 2541c0aa2d19SHong Zhang /* 20*/ MatAssemblyBegin_SeqDense, 2542c0aa2d19SHong Zhang MatAssemblyEnd_SeqDense, 2543905e6a2fSBarry Smith MatSetOption_SeqDense, 2544905e6a2fSBarry Smith MatZeroEntries_SeqDense, 2545d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqDense, 2546db4efbfdSBarry Smith 0, 2547db4efbfdSBarry Smith 0, 2548db4efbfdSBarry Smith 0, 2549db4efbfdSBarry Smith 0, 25504994cf47SJed Brown /* 29*/ MatSetUp_SeqDense, 2551273d9f13SBarry Smith 0, 2552905e6a2fSBarry Smith 0, 255373a71a0fSBarry Smith 0, 255473a71a0fSBarry Smith 0, 2555d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqDense, 2556a5ae1ecdSBarry Smith 0, 2557a5ae1ecdSBarry Smith 0, 2558a5ae1ecdSBarry Smith 0, 2559a5ae1ecdSBarry Smith 0, 2560d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqDense, 25617dae84e0SHong Zhang MatCreateSubMatrices_SeqDense, 2562a5ae1ecdSBarry Smith 0, 25634b0e389bSBarry Smith MatGetValues_SeqDense, 2564a5ae1ecdSBarry Smith MatCopy_SeqDense, 2565d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqDense, 2566a5ae1ecdSBarry Smith MatScale_SeqDense, 25677d68702bSBarry Smith MatShift_Basic, 2568a5ae1ecdSBarry Smith 0, 25693f49a652SStefano Zampini MatZeroRowsColumns_SeqDense, 257073a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqDense, 2571a5ae1ecdSBarry Smith 0, 2572a5ae1ecdSBarry Smith 0, 2573a5ae1ecdSBarry Smith 0, 2574a5ae1ecdSBarry Smith 0, 2575d519adbfSMatthew Knepley /* 54*/ 0, 2576a5ae1ecdSBarry Smith 0, 2577a5ae1ecdSBarry Smith 0, 2578a5ae1ecdSBarry Smith 0, 2579a5ae1ecdSBarry Smith 0, 2580d519adbfSMatthew Knepley /* 59*/ 0, 2581e03a110bSBarry Smith MatDestroy_SeqDense, 2582e03a110bSBarry Smith MatView_SeqDense, 2583357abbc8SBarry Smith 0, 258497304618SKris Buschelman 0, 2585d519adbfSMatthew Knepley /* 64*/ 0, 258697304618SKris Buschelman 0, 258797304618SKris Buschelman 0, 258897304618SKris Buschelman 0, 258997304618SKris Buschelman 0, 2590d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqDense, 259197304618SKris Buschelman 0, 259297304618SKris Buschelman 0, 259397304618SKris Buschelman 0, 259497304618SKris Buschelman 0, 2595d519adbfSMatthew Knepley /* 74*/ 0, 259697304618SKris Buschelman 0, 259797304618SKris Buschelman 0, 259897304618SKris Buschelman 0, 259997304618SKris Buschelman 0, 2600d519adbfSMatthew Knepley /* 79*/ 0, 260197304618SKris Buschelman 0, 260297304618SKris Buschelman 0, 260397304618SKris Buschelman 0, 26045bba2384SShri Abhyankar /* 83*/ MatLoad_SeqDense, 2605637a0070SStefano Zampini MatIsSymmetric_SeqDense, 26061cbb95d3SBarry Smith MatIsHermitian_SeqDense, 2607865e5f61SKris Buschelman 0, 2608865e5f61SKris Buschelman 0, 2609865e5f61SKris Buschelman 0, 26104222ddf1SHong Zhang /* 89*/ 0, 26114222ddf1SHong Zhang 0, 2612a9fe9ddaSSatish Balay MatMatMultNumeric_SeqDense_SeqDense, 26134222ddf1SHong Zhang 0, 26144222ddf1SHong Zhang 0, 26154222ddf1SHong Zhang /* 94*/ 0, 26164222ddf1SHong Zhang 0, 26174222ddf1SHong Zhang 0, 261869f65d41SStefano Zampini MatMatTransposeMultNumeric_SeqDense_SeqDense, 2619284134d9SBarry Smith 0, 26204222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqDense, 2621284134d9SBarry Smith 0, 2622284134d9SBarry Smith 0, 2623ba337c44SJed Brown MatConjugate_SeqDense, 2624f73d5cc4SBarry Smith 0, 2625ba337c44SJed Brown /*104*/ 0, 2626ba337c44SJed Brown MatRealPart_SeqDense, 2627ba337c44SJed Brown MatImaginaryPart_SeqDense, 2628985db425SBarry Smith 0, 2629985db425SBarry Smith 0, 26308208b9aeSStefano Zampini /*109*/ 0, 2631985db425SBarry Smith 0, 26328d0534beSBarry Smith MatGetRowMin_SeqDense, 2633aabbc4fbSShri Abhyankar MatGetColumnVector_SeqDense, 26343b49f96aSBarry Smith MatMissingDiagonal_SeqDense, 2635aabbc4fbSShri Abhyankar /*114*/ 0, 2636aabbc4fbSShri Abhyankar 0, 2637aabbc4fbSShri Abhyankar 0, 2638aabbc4fbSShri Abhyankar 0, 2639aabbc4fbSShri Abhyankar 0, 2640aabbc4fbSShri Abhyankar /*119*/ 0, 2641aabbc4fbSShri Abhyankar 0, 2642aabbc4fbSShri Abhyankar 0, 26430716a85fSBarry Smith 0, 26440716a85fSBarry Smith 0, 26450716a85fSBarry Smith /*124*/ 0, 26465df89d91SHong Zhang MatGetColumnNorms_SeqDense, 26475df89d91SHong Zhang 0, 26485df89d91SHong Zhang 0, 26495df89d91SHong Zhang 0, 26505df89d91SHong Zhang /*129*/ 0, 26514222ddf1SHong Zhang 0, 26524222ddf1SHong Zhang 0, 265375648e8dSHong Zhang MatTransposeMatMultNumeric_SeqDense_SeqDense, 26543964eb88SJed Brown 0, 26553964eb88SJed Brown /*134*/ 0, 26563964eb88SJed Brown 0, 26573964eb88SJed Brown 0, 26583964eb88SJed Brown 0, 26593964eb88SJed Brown 0, 26603964eb88SJed Brown /*139*/ 0, 2661f9426fe0SMark Adams 0, 2662d528f656SJakub Kruzik 0, 2663d528f656SJakub Kruzik 0, 2664d528f656SJakub Kruzik 0, 26654222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqDense, 26664222ddf1SHong Zhang /*145*/ 0, 26674222ddf1SHong Zhang 0, 26684222ddf1SHong Zhang 0 2669985db425SBarry Smith }; 267090ace30eSBarry Smith 26714b828684SBarry Smith /*@C 2672fafbff53SBarry Smith MatCreateSeqDense - Creates a sequential dense matrix that 2673d65003e9SLois Curfman McInnes is stored in column major order (the usual Fortran 77 manner). Many 2674d65003e9SLois Curfman McInnes of the matrix operations use the BLAS and LAPACK routines. 2675289bc588SBarry Smith 2676d083f849SBarry Smith Collective 2677db81eaa0SLois Curfman McInnes 267820563c6bSBarry Smith Input Parameters: 2679db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 26800c775827SLois Curfman McInnes . m - number of rows 268118f449edSLois Curfman McInnes . n - number of columns 26820298fd71SBarry Smith - data - optional location of matrix data in column major order. Set data=NULL for PETSc 2683dfc5480cSLois Curfman McInnes to control all matrix memory allocation. 268420563c6bSBarry Smith 268520563c6bSBarry Smith Output Parameter: 268644cd7ae7SLois Curfman McInnes . A - the matrix 268720563c6bSBarry Smith 2688b259b22eSLois Curfman McInnes Notes: 268918f449edSLois Curfman McInnes The data input variable is intended primarily for Fortran programmers 269018f449edSLois Curfman McInnes who wish to allocate their own matrix memory space. Most users should 26910298fd71SBarry Smith set data=NULL. 269218f449edSLois Curfman McInnes 2693027ccd11SLois Curfman McInnes Level: intermediate 2694027ccd11SLois Curfman McInnes 269569b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateDense(), MatSetValues() 269620563c6bSBarry Smith @*/ 26977087cfbeSBarry Smith PetscErrorCode MatCreateSeqDense(MPI_Comm comm,PetscInt m,PetscInt n,PetscScalar *data,Mat *A) 2698289bc588SBarry Smith { 2699dfbe8321SBarry Smith PetscErrorCode ierr; 27003b2fbd54SBarry Smith 27013a40ed3dSBarry Smith PetscFunctionBegin; 2702f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 2703f69a0ea3SMatthew Knepley ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 2704273d9f13SBarry Smith ierr = MatSetType(*A,MATSEQDENSE);CHKERRQ(ierr); 2705273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(*A,data);CHKERRQ(ierr); 2706273d9f13SBarry Smith PetscFunctionReturn(0); 2707273d9f13SBarry Smith } 2708273d9f13SBarry Smith 2709273d9f13SBarry Smith /*@C 2710273d9f13SBarry Smith MatSeqDenseSetPreallocation - Sets the array used for storing the matrix elements 2711273d9f13SBarry Smith 2712d083f849SBarry Smith Collective 2713273d9f13SBarry Smith 2714273d9f13SBarry Smith Input Parameters: 27151c4f3114SJed Brown + B - the matrix 27160298fd71SBarry Smith - data - the array (or NULL) 2717273d9f13SBarry Smith 2718273d9f13SBarry Smith Notes: 2719273d9f13SBarry Smith The data input variable is intended primarily for Fortran programmers 2720273d9f13SBarry Smith who wish to allocate their own matrix memory space. Most users should 2721284134d9SBarry Smith need not call this routine. 2722273d9f13SBarry Smith 2723273d9f13SBarry Smith Level: intermediate 2724273d9f13SBarry Smith 2725ad16ce7aSStefano Zampini .seealso: MatCreate(), MatCreateDense(), MatSetValues(), MatDenseSetLDA() 2726867c911aSBarry Smith 2727273d9f13SBarry Smith @*/ 27287087cfbeSBarry Smith PetscErrorCode MatSeqDenseSetPreallocation(Mat B,PetscScalar data[]) 2729273d9f13SBarry Smith { 27304ac538c5SBarry Smith PetscErrorCode ierr; 2731a23d5eceSKris Buschelman 2732a23d5eceSKris Buschelman PetscFunctionBegin; 2733d5ea218eSStefano Zampini PetscValidHeaderSpecific(B,MAT_CLASSID,1); 27344ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqDenseSetPreallocation_C",(Mat,PetscScalar[]),(B,data));CHKERRQ(ierr); 2735a23d5eceSKris Buschelman PetscFunctionReturn(0); 2736a23d5eceSKris Buschelman } 2737a23d5eceSKris Buschelman 27387087cfbeSBarry Smith PetscErrorCode MatSeqDenseSetPreallocation_SeqDense(Mat B,PetscScalar *data) 2739a23d5eceSKris Buschelman { 2740ad16ce7aSStefano Zampini Mat_SeqDense *b = (Mat_SeqDense*)B->data; 2741dfbe8321SBarry Smith PetscErrorCode ierr; 2742273d9f13SBarry Smith 2743273d9f13SBarry Smith PetscFunctionBegin; 2744273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 2745a868139aSShri Abhyankar 274634ef9618SShri Abhyankar ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 274734ef9618SShri Abhyankar ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 274834ef9618SShri Abhyankar 2749ad16ce7aSStefano Zampini if (b->lda <= 0) b->lda = B->rmap->n; 275086d161a7SShri Abhyankar 2751ad16ce7aSStefano Zampini ierr = PetscIntMultError(b->lda,B->cmap->n,NULL);CHKERRQ(ierr); 27529e8f95c4SLisandro Dalcin if (!data) { /* petsc-allocated storage */ 27539e8f95c4SLisandro Dalcin if (!b->user_alloc) { ierr = PetscFree(b->v);CHKERRQ(ierr); } 2754ad16ce7aSStefano Zampini ierr = PetscCalloc1((size_t)b->lda*B->cmap->n,&b->v);CHKERRQ(ierr); 2755ad16ce7aSStefano Zampini ierr = PetscLogObjectMemory((PetscObject)B,b->lda*B->cmap->n*sizeof(PetscScalar));CHKERRQ(ierr); 27562205254eSKarl Rupp 27579e8f95c4SLisandro Dalcin b->user_alloc = PETSC_FALSE; 2758273d9f13SBarry Smith } else { /* user-allocated storage */ 27599e8f95c4SLisandro Dalcin if (!b->user_alloc) { ierr = PetscFree(b->v);CHKERRQ(ierr); } 2760273d9f13SBarry Smith b->v = data; 2761273d9f13SBarry Smith b->user_alloc = PETSC_TRUE; 2762273d9f13SBarry Smith } 27630450473dSBarry Smith B->assembled = PETSC_TRUE; 2764273d9f13SBarry Smith PetscFunctionReturn(0); 2765273d9f13SBarry Smith } 2766273d9f13SBarry Smith 276765b80a83SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 2768cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqDense_Elemental(Mat A, MatType newtype,MatReuse reuse,Mat *newmat) 27698baccfbdSHong Zhang { 2770d77f618aSHong Zhang Mat mat_elemental; 2771d77f618aSHong Zhang PetscErrorCode ierr; 27721683a169SBarry Smith const PetscScalar *array; 27731683a169SBarry Smith PetscScalar *v_colwise; 2774d77f618aSHong Zhang PetscInt M=A->rmap->N,N=A->cmap->N,i,j,k,*rows,*cols; 2775d77f618aSHong Zhang 27768baccfbdSHong Zhang PetscFunctionBegin; 2777d77f618aSHong Zhang ierr = PetscMalloc3(M*N,&v_colwise,M,&rows,N,&cols);CHKERRQ(ierr); 27781683a169SBarry Smith ierr = MatDenseGetArrayRead(A,&array);CHKERRQ(ierr); 2779d77f618aSHong Zhang /* convert column-wise array into row-wise v_colwise, see MatSetValues_Elemental() */ 2780d77f618aSHong Zhang k = 0; 2781d77f618aSHong Zhang for (j=0; j<N; j++) { 2782d77f618aSHong Zhang cols[j] = j; 2783d77f618aSHong Zhang for (i=0; i<M; i++) { 2784d77f618aSHong Zhang v_colwise[j*M+i] = array[k++]; 2785d77f618aSHong Zhang } 2786d77f618aSHong Zhang } 2787d77f618aSHong Zhang for (i=0; i<M; i++) { 2788d77f618aSHong Zhang rows[i] = i; 2789d77f618aSHong Zhang } 27901683a169SBarry Smith ierr = MatDenseRestoreArrayRead(A,&array);CHKERRQ(ierr); 2791d77f618aSHong Zhang 2792d77f618aSHong Zhang ierr = MatCreate(PetscObjectComm((PetscObject)A), &mat_elemental);CHKERRQ(ierr); 2793d77f618aSHong Zhang ierr = MatSetSizes(mat_elemental,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 2794d77f618aSHong Zhang ierr = MatSetType(mat_elemental,MATELEMENTAL);CHKERRQ(ierr); 2795d77f618aSHong Zhang ierr = MatSetUp(mat_elemental);CHKERRQ(ierr); 2796d77f618aSHong Zhang 2797d77f618aSHong Zhang /* PETSc-Elemental interaface uses axpy for setting off-processor entries, only ADD_VALUES is allowed */ 2798d77f618aSHong Zhang ierr = MatSetValues(mat_elemental,M,rows,N,cols,v_colwise,ADD_VALUES);CHKERRQ(ierr); 2799d77f618aSHong Zhang ierr = MatAssemblyBegin(mat_elemental, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2800d77f618aSHong Zhang ierr = MatAssemblyEnd(mat_elemental, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2801d77f618aSHong Zhang ierr = PetscFree3(v_colwise,rows,cols);CHKERRQ(ierr); 2802d77f618aSHong Zhang 2803511c6705SHong Zhang if (reuse == MAT_INPLACE_MATRIX) { 280428be2f97SBarry Smith ierr = MatHeaderReplace(A,&mat_elemental);CHKERRQ(ierr); 2805d77f618aSHong Zhang } else { 2806d77f618aSHong Zhang *newmat = mat_elemental; 2807d77f618aSHong Zhang } 28088baccfbdSHong Zhang PetscFunctionReturn(0); 28098baccfbdSHong Zhang } 281065b80a83SHong Zhang #endif 28118baccfbdSHong Zhang 2812ad16ce7aSStefano Zampini static PetscErrorCode MatDenseSetLDA_SeqDense(Mat B,PetscInt lda) 28131b807ce4Svictorle { 28141b807ce4Svictorle Mat_SeqDense *b = (Mat_SeqDense*)B->data; 281521a2c019SBarry Smith 28161b807ce4Svictorle PetscFunctionBegin; 2817e32f2f54SBarry Smith if (lda < B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"LDA %D must be at least matrix dimension %D",lda,B->rmap->n); 28181b807ce4Svictorle b->lda = lda; 28191b807ce4Svictorle PetscFunctionReturn(0); 28201b807ce4Svictorle } 28211b807ce4Svictorle 2822d528f656SJakub Kruzik PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqDense(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 2823d528f656SJakub Kruzik { 2824d528f656SJakub Kruzik PetscErrorCode ierr; 2825d528f656SJakub Kruzik PetscMPIInt size; 2826d528f656SJakub Kruzik 2827d528f656SJakub Kruzik PetscFunctionBegin; 2828d528f656SJakub Kruzik ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 2829d528f656SJakub Kruzik if (size == 1) { 2830d528f656SJakub Kruzik if (scall == MAT_INITIAL_MATRIX) { 2831d528f656SJakub Kruzik ierr = MatDuplicate(inmat,MAT_COPY_VALUES,outmat);CHKERRQ(ierr); 2832d528f656SJakub Kruzik } else { 2833d528f656SJakub Kruzik ierr = MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 2834d528f656SJakub Kruzik } 2835d528f656SJakub Kruzik } else { 2836d528f656SJakub Kruzik ierr = MatCreateMPIMatConcatenateSeqMat_MPIDense(comm,inmat,n,scall,outmat);CHKERRQ(ierr); 2837d528f656SJakub Kruzik } 2838d528f656SJakub Kruzik PetscFunctionReturn(0); 2839d528f656SJakub Kruzik } 2840d528f656SJakub Kruzik 28416947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVec_SeqDense(Mat A,PetscInt col,Vec *v) 28426947451fSStefano Zampini { 28436947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 28446947451fSStefano Zampini PetscErrorCode ierr; 28456947451fSStefano Zampini 28466947451fSStefano Zampini PetscFunctionBegin; 28476947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 28486947451fSStefano Zampini if (!a->cvec) { 28496947451fSStefano Zampini ierr = VecCreateSeqWithArray(PetscObjectComm((PetscObject)A),A->rmap->bs,A->rmap->n,NULL,&a->cvec);CHKERRQ(ierr); 28506947451fSStefano Zampini } 28516947451fSStefano Zampini a->vecinuse = col + 1; 28526947451fSStefano Zampini ierr = MatDenseGetArray(A,(PetscScalar**)&a->ptrinuse);CHKERRQ(ierr); 28536947451fSStefano Zampini ierr = VecPlaceArray(a->cvec,a->ptrinuse + (size_t)col * (size_t)a->lda);CHKERRQ(ierr); 28546947451fSStefano Zampini *v = a->cvec; 28556947451fSStefano Zampini PetscFunctionReturn(0); 28566947451fSStefano Zampini } 28576947451fSStefano Zampini 28586947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVec_SeqDense(Mat A,PetscInt col,Vec *v) 28596947451fSStefano Zampini { 28606947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 28616947451fSStefano Zampini PetscErrorCode ierr; 28626947451fSStefano Zampini 28636947451fSStefano Zampini PetscFunctionBegin; 28646947451fSStefano Zampini if (!a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseGetColumnVec first"); 28656947451fSStefano Zampini if (!a->cvec) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Missing internal column vector"); 28666947451fSStefano Zampini a->vecinuse = 0; 28676947451fSStefano Zampini ierr = MatDenseRestoreArray(A,(PetscScalar**)&a->ptrinuse);CHKERRQ(ierr); 28686947451fSStefano Zampini ierr = VecResetArray(a->cvec);CHKERRQ(ierr); 28696947451fSStefano Zampini *v = NULL; 28706947451fSStefano Zampini PetscFunctionReturn(0); 28716947451fSStefano Zampini } 28726947451fSStefano Zampini 28736947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVecRead_SeqDense(Mat A,PetscInt col,Vec *v) 28746947451fSStefano Zampini { 28756947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 28766947451fSStefano Zampini PetscErrorCode ierr; 28776947451fSStefano Zampini 28786947451fSStefano Zampini PetscFunctionBegin; 28796947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 28806947451fSStefano Zampini if (!a->cvec) { 28816947451fSStefano Zampini ierr = VecCreateSeqWithArray(PetscObjectComm((PetscObject)A),A->rmap->bs,A->rmap->n,NULL,&a->cvec);CHKERRQ(ierr); 28826947451fSStefano Zampini } 28836947451fSStefano Zampini a->vecinuse = col + 1; 28846947451fSStefano Zampini ierr = MatDenseGetArrayRead(A,&a->ptrinuse);CHKERRQ(ierr); 28856947451fSStefano Zampini ierr = VecPlaceArray(a->cvec,a->ptrinuse + (size_t)col * (size_t)a->lda);CHKERRQ(ierr); 28866947451fSStefano Zampini ierr = VecLockReadPush(a->cvec);CHKERRQ(ierr); 28876947451fSStefano Zampini *v = a->cvec; 28886947451fSStefano Zampini PetscFunctionReturn(0); 28896947451fSStefano Zampini } 28906947451fSStefano Zampini 28916947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVecRead_SeqDense(Mat A,PetscInt col,Vec *v) 28926947451fSStefano Zampini { 28936947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 28946947451fSStefano Zampini PetscErrorCode ierr; 28956947451fSStefano Zampini 28966947451fSStefano Zampini PetscFunctionBegin; 28976947451fSStefano Zampini if (!a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseGetColumnVec first"); 28986947451fSStefano Zampini if (!a->cvec) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Missing internal column vector"); 28996947451fSStefano Zampini a->vecinuse = 0; 29006947451fSStefano Zampini ierr = MatDenseRestoreArrayRead(A,&a->ptrinuse);CHKERRQ(ierr); 29016947451fSStefano Zampini ierr = VecLockReadPop(a->cvec);CHKERRQ(ierr); 29026947451fSStefano Zampini ierr = VecResetArray(a->cvec);CHKERRQ(ierr); 29036947451fSStefano Zampini *v = NULL; 29046947451fSStefano Zampini PetscFunctionReturn(0); 29056947451fSStefano Zampini } 29066947451fSStefano Zampini 29076947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVecWrite_SeqDense(Mat A,PetscInt col,Vec *v) 29086947451fSStefano Zampini { 29096947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 29106947451fSStefano Zampini PetscErrorCode ierr; 29116947451fSStefano Zampini 29126947451fSStefano Zampini PetscFunctionBegin; 29136947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 29146947451fSStefano Zampini if (!a->cvec) { 29156947451fSStefano Zampini ierr = VecCreateSeqWithArray(PetscObjectComm((PetscObject)A),A->rmap->bs,A->rmap->n,NULL,&a->cvec);CHKERRQ(ierr); 29166947451fSStefano Zampini } 29176947451fSStefano Zampini a->vecinuse = col + 1; 29186947451fSStefano Zampini ierr = MatDenseGetArrayWrite(A,(PetscScalar**)&a->ptrinuse);CHKERRQ(ierr); 29196947451fSStefano Zampini ierr = VecPlaceArray(a->cvec,a->ptrinuse + (size_t)col * (size_t)a->lda);CHKERRQ(ierr); 29206947451fSStefano Zampini *v = a->cvec; 29216947451fSStefano Zampini PetscFunctionReturn(0); 29226947451fSStefano Zampini } 29236947451fSStefano Zampini 29246947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVecWrite_SeqDense(Mat A,PetscInt col,Vec *v) 29256947451fSStefano Zampini { 29266947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 29276947451fSStefano Zampini PetscErrorCode ierr; 29286947451fSStefano Zampini 29296947451fSStefano Zampini PetscFunctionBegin; 29306947451fSStefano Zampini if (!a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseGetColumnVec first"); 29316947451fSStefano Zampini if (!a->cvec) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Missing internal column vector"); 29326947451fSStefano Zampini a->vecinuse = 0; 29336947451fSStefano Zampini ierr = MatDenseRestoreArrayWrite(A,(PetscScalar**)&a->ptrinuse);CHKERRQ(ierr); 29346947451fSStefano Zampini ierr = VecResetArray(a->cvec);CHKERRQ(ierr); 29356947451fSStefano Zampini *v = NULL; 29366947451fSStefano Zampini PetscFunctionReturn(0); 29376947451fSStefano Zampini } 29386947451fSStefano Zampini 29390bad9183SKris Buschelman /*MC 2940fafad747SKris Buschelman MATSEQDENSE - MATSEQDENSE = "seqdense" - A matrix type to be used for sequential dense matrices. 29410bad9183SKris Buschelman 29420bad9183SKris Buschelman Options Database Keys: 29430bad9183SKris Buschelman . -mat_type seqdense - sets the matrix type to "seqdense" during a call to MatSetFromOptions() 29440bad9183SKris Buschelman 29450bad9183SKris Buschelman Level: beginner 29460bad9183SKris Buschelman 294789665df3SBarry Smith .seealso: MatCreateSeqDense() 294889665df3SBarry Smith 29490bad9183SKris Buschelman M*/ 2950ca15aa20SStefano Zampini PetscErrorCode MatCreate_SeqDense(Mat B) 2951273d9f13SBarry Smith { 2952273d9f13SBarry Smith Mat_SeqDense *b; 2953dfbe8321SBarry Smith PetscErrorCode ierr; 29547c334f02SBarry Smith PetscMPIInt size; 2955273d9f13SBarry Smith 2956273d9f13SBarry Smith PetscFunctionBegin; 2957ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)B),&size);CHKERRQ(ierr); 2958e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Comm must be of size 1"); 295955659b69SBarry Smith 2960b00a9115SJed Brown ierr = PetscNewLog(B,&b);CHKERRQ(ierr); 2961549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 296244cd7ae7SLois Curfman McInnes B->data = (void*)b; 296318f449edSLois Curfman McInnes 2964273d9f13SBarry Smith b->roworiented = PETSC_TRUE; 29654e220ebcSLois Curfman McInnes 296649a6ff4bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetLDA_C",MatDenseGetLDA_SeqDense);CHKERRQ(ierr); 2967ad16ce7aSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseSetLDA_C",MatDenseSetLDA_SeqDense);CHKERRQ(ierr); 2968bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetArray_C",MatDenseGetArray_SeqDense);CHKERRQ(ierr); 29698572280aSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreArray_C",MatDenseRestoreArray_SeqDense);CHKERRQ(ierr); 2970d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDensePlaceArray_C",MatDensePlaceArray_SeqDense);CHKERRQ(ierr); 2971d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseResetArray_C",MatDenseResetArray_SeqDense);CHKERRQ(ierr); 2972d5ea218eSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseReplaceArray_C",MatDenseReplaceArray_SeqDense);CHKERRQ(ierr); 29738572280aSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetArrayRead_C",MatDenseGetArray_SeqDense);CHKERRQ(ierr); 2974715b7558SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreArrayRead_C",MatDenseRestoreArray_SeqDense);CHKERRQ(ierr); 29756947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetArrayWrite_C",MatDenseGetArray_SeqDense);CHKERRQ(ierr); 29766947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreArrayWrite_C",MatDenseRestoreArray_SeqDense);CHKERRQ(ierr); 2977bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqdense_seqaij_C",MatConvert_SeqDense_SeqAIJ);CHKERRQ(ierr); 29788baccfbdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 29798baccfbdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqdense_elemental_C",MatConvert_SeqDense_Elemental);CHKERRQ(ierr); 29808baccfbdSHong Zhang #endif 29812bf066beSStefano Zampini #if defined(PETSC_HAVE_CUDA) 29822bf066beSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqdense_seqdensecuda_C",MatConvert_SeqDense_SeqDenseCUDA);CHKERRQ(ierr); 29834222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdensecuda_seqdensecuda_C",MatProductSetFromOptions_SeqDense);CHKERRQ(ierr); 29844222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdensecuda_seqdense_C",MatProductSetFromOptions_SeqDense);CHKERRQ(ierr); 2985637a0070SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqdensecuda_C",MatProductSetFromOptions_SeqDense);CHKERRQ(ierr); 29864222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaijcusparse_seqdense_C",MatProductSetFromOptions_SeqAIJ_SeqDense);CHKERRQ(ierr); 29872bf066beSStefano Zampini #endif 2988bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqDenseSetPreallocation_C",MatSeqDenseSetPreallocation_SeqDense);CHKERRQ(ierr); 29894222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqdense_C",MatProductSetFromOptions_SeqAIJ_SeqDense);CHKERRQ(ierr); 29904222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqdense_C",MatProductSetFromOptions_SeqDense);CHKERRQ(ierr); 29914222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqbaij_seqdense_C",MatProductSetFromOptions_SeqXBAIJ_SeqDense);CHKERRQ(ierr); 29924222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqsbaij_seqdense_C",MatProductSetFromOptions_SeqXBAIJ_SeqDense);CHKERRQ(ierr); 299396e6d5c4SRichard Tran Mills 2994af53bab2SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumn_C",MatDenseGetColumn_SeqDense);CHKERRQ(ierr); 2995af53bab2SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumn_C",MatDenseRestoreColumn_SeqDense);CHKERRQ(ierr); 29966947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumnVec_C",MatDenseGetColumnVec_SeqDense);CHKERRQ(ierr); 29976947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumnVec_C",MatDenseRestoreColumnVec_SeqDense);CHKERRQ(ierr); 29986947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumnVecRead_C",MatDenseGetColumnVecRead_SeqDense);CHKERRQ(ierr); 29996947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumnVecRead_C",MatDenseRestoreColumnVecRead_SeqDense);CHKERRQ(ierr); 30006947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumnVecWrite_C",MatDenseGetColumnVecWrite_SeqDense);CHKERRQ(ierr); 30016947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumnVecWrite_C",MatDenseRestoreColumnVecWrite_SeqDense);CHKERRQ(ierr); 300217667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQDENSE);CHKERRQ(ierr); 30033a40ed3dSBarry Smith PetscFunctionReturn(0); 3004289bc588SBarry Smith } 300586aefd0dSHong Zhang 300686aefd0dSHong Zhang /*@C 3007af53bab2SHong Zhang MatDenseGetColumn - gives access to a column of a dense matrix. This is only the local part of the column. You MUST call MatDenseRestoreColumn() to avoid memory bleeding. 300886aefd0dSHong Zhang 300986aefd0dSHong Zhang Not Collective 301086aefd0dSHong Zhang 301186aefd0dSHong Zhang Input Parameter: 301286aefd0dSHong Zhang + mat - a MATSEQDENSE or MATMPIDENSE matrix 301386aefd0dSHong Zhang - col - column index 301486aefd0dSHong Zhang 301586aefd0dSHong Zhang Output Parameter: 301686aefd0dSHong Zhang . vals - pointer to the data 301786aefd0dSHong Zhang 301886aefd0dSHong Zhang Level: intermediate 301986aefd0dSHong Zhang 302086aefd0dSHong Zhang .seealso: MatDenseRestoreColumn() 302186aefd0dSHong Zhang @*/ 302286aefd0dSHong Zhang PetscErrorCode MatDenseGetColumn(Mat A,PetscInt col,PetscScalar **vals) 302386aefd0dSHong Zhang { 302486aefd0dSHong Zhang PetscErrorCode ierr; 302586aefd0dSHong Zhang 302686aefd0dSHong Zhang PetscFunctionBegin; 3027d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 3028d5ea218eSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 3029d5ea218eSStefano Zampini PetscValidPointer(vals,3); 303086aefd0dSHong Zhang ierr = PetscUseMethod(A,"MatDenseGetColumn_C",(Mat,PetscInt,PetscScalar**),(A,col,vals));CHKERRQ(ierr); 303186aefd0dSHong Zhang PetscFunctionReturn(0); 303286aefd0dSHong Zhang } 303386aefd0dSHong Zhang 303486aefd0dSHong Zhang /*@C 303586aefd0dSHong Zhang MatDenseRestoreColumn - returns access to a column of a dense matrix which is returned by MatDenseGetColumn(). 303686aefd0dSHong Zhang 303786aefd0dSHong Zhang Not Collective 303886aefd0dSHong Zhang 303986aefd0dSHong Zhang Input Parameter: 304086aefd0dSHong Zhang . mat - a MATSEQDENSE or MATMPIDENSE matrix 304186aefd0dSHong Zhang 304286aefd0dSHong Zhang Output Parameter: 304386aefd0dSHong Zhang . vals - pointer to the data 304486aefd0dSHong Zhang 304586aefd0dSHong Zhang Level: intermediate 304686aefd0dSHong Zhang 304786aefd0dSHong Zhang .seealso: MatDenseGetColumn() 304886aefd0dSHong Zhang @*/ 304986aefd0dSHong Zhang PetscErrorCode MatDenseRestoreColumn(Mat A,PetscScalar **vals) 305086aefd0dSHong Zhang { 305186aefd0dSHong Zhang PetscErrorCode ierr; 305286aefd0dSHong Zhang 305386aefd0dSHong Zhang PetscFunctionBegin; 3054d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 3055d5ea218eSStefano Zampini PetscValidPointer(vals,2); 305686aefd0dSHong Zhang ierr = PetscUseMethod(A,"MatDenseRestoreColumn_C",(Mat,PetscScalar**),(A,vals));CHKERRQ(ierr); 305786aefd0dSHong Zhang PetscFunctionReturn(0); 305886aefd0dSHong Zhang } 30596947451fSStefano Zampini 30606947451fSStefano Zampini /*@C 30616947451fSStefano Zampini MatDenseGetColumnVec - Gives read-write access to a column of a dense matrix, represented as a Vec. 30626947451fSStefano Zampini 30636947451fSStefano Zampini Collective 30646947451fSStefano Zampini 30656947451fSStefano Zampini Input Parameter: 30666947451fSStefano Zampini + mat - the Mat object 30676947451fSStefano Zampini - col - the column index 30686947451fSStefano Zampini 30696947451fSStefano Zampini Output Parameter: 30706947451fSStefano Zampini . v - the vector 30716947451fSStefano Zampini 30726947451fSStefano Zampini Notes: 30736947451fSStefano Zampini The vector is owned by PETSc. Users need to call MatDenseRestoreColumnVec() when the vector is no longer needed. 30746947451fSStefano Zampini Use MatDenseGetColumnVecRead() to obtain read-only access or MatDenseGetColumnVecWrite() for write-only access. 30756947451fSStefano Zampini 30766947451fSStefano Zampini Level: intermediate 30776947451fSStefano Zampini 30786947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVecRead(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecRead(), MatDenseRestoreColumnVecWrite() 30796947451fSStefano Zampini @*/ 30806947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVec(Mat A,PetscInt col,Vec *v) 30816947451fSStefano Zampini { 30826947451fSStefano Zampini PetscErrorCode ierr; 30836947451fSStefano Zampini 30846947451fSStefano Zampini PetscFunctionBegin; 30856947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 30866947451fSStefano Zampini PetscValidType(A,1); 30876947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 30886947451fSStefano Zampini PetscValidPointer(v,3); 30896947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 30906947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 30916947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseGetColumnVec_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 30926947451fSStefano Zampini PetscFunctionReturn(0); 30936947451fSStefano Zampini } 30946947451fSStefano Zampini 30956947451fSStefano Zampini /*@C 30966947451fSStefano Zampini MatDenseRestoreColumnVec - Returns access to a column of a dense matrix obtained from MatDenseGetColumnVec(). 30976947451fSStefano Zampini 30986947451fSStefano Zampini Collective 30996947451fSStefano Zampini 31006947451fSStefano Zampini Input Parameter: 31016947451fSStefano Zampini + mat - the Mat object 31026947451fSStefano Zampini . col - the column index 31036947451fSStefano Zampini - v - the Vec object 31046947451fSStefano Zampini 31056947451fSStefano Zampini Level: intermediate 31066947451fSStefano Zampini 31076947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecRead(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVecRead(), MatDenseRestoreColumnVecWrite() 31086947451fSStefano Zampini @*/ 31096947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVec(Mat A,PetscInt col,Vec *v) 31106947451fSStefano Zampini { 31116947451fSStefano Zampini PetscErrorCode ierr; 31126947451fSStefano Zampini 31136947451fSStefano Zampini PetscFunctionBegin; 31146947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 31156947451fSStefano Zampini PetscValidType(A,1); 31166947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 31176947451fSStefano Zampini PetscValidPointer(v,3); 31186947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 31196947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 31206947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseRestoreColumnVec_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 31216947451fSStefano Zampini PetscFunctionReturn(0); 31226947451fSStefano Zampini } 31236947451fSStefano Zampini 31246947451fSStefano Zampini /*@C 31256947451fSStefano Zampini MatDenseGetColumnVecRead - Gives read-only access to a column of a dense matrix, represented as a Vec. 31266947451fSStefano Zampini 31276947451fSStefano Zampini Collective 31286947451fSStefano Zampini 31296947451fSStefano Zampini Input Parameter: 31306947451fSStefano Zampini + mat - the Mat object 31316947451fSStefano Zampini - col - the column index 31326947451fSStefano Zampini 31336947451fSStefano Zampini Output Parameter: 31346947451fSStefano Zampini . v - the vector 31356947451fSStefano Zampini 31366947451fSStefano Zampini Notes: 31376947451fSStefano Zampini The vector is owned by PETSc and users cannot modify it. 31386947451fSStefano Zampini Users need to call MatDenseRestoreColumnVecRead() when the vector is no longer needed. 31396947451fSStefano Zampini Use MatDenseGetColumnVec() to obtain read-write access or MatDenseGetColumnVecWrite() for write-only access. 31406947451fSStefano Zampini 31416947451fSStefano Zampini Level: intermediate 31426947451fSStefano Zampini 31436947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecRead(), MatDenseRestoreColumnVecWrite() 31446947451fSStefano Zampini @*/ 31456947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVecRead(Mat A,PetscInt col,Vec *v) 31466947451fSStefano Zampini { 31476947451fSStefano Zampini PetscErrorCode ierr; 31486947451fSStefano Zampini 31496947451fSStefano Zampini PetscFunctionBegin; 31506947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 31516947451fSStefano Zampini PetscValidType(A,1); 31526947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 31536947451fSStefano Zampini PetscValidPointer(v,3); 31546947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 31556947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 31566947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseGetColumnVecRead_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 31576947451fSStefano Zampini PetscFunctionReturn(0); 31586947451fSStefano Zampini } 31596947451fSStefano Zampini 31606947451fSStefano Zampini /*@C 31616947451fSStefano Zampini MatDenseRestoreColumnVecRead - Returns access to a column of a dense matrix obtained from MatDenseGetColumnVecRead(). 31626947451fSStefano Zampini 31636947451fSStefano Zampini Collective 31646947451fSStefano Zampini 31656947451fSStefano Zampini Input Parameter: 31666947451fSStefano Zampini + mat - the Mat object 31676947451fSStefano Zampini . col - the column index 31686947451fSStefano Zampini - v - the Vec object 31696947451fSStefano Zampini 31706947451fSStefano Zampini Level: intermediate 31716947451fSStefano Zampini 31726947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecRead(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecWrite() 31736947451fSStefano Zampini @*/ 31746947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVecRead(Mat A,PetscInt col,Vec *v) 31756947451fSStefano Zampini { 31766947451fSStefano Zampini PetscErrorCode ierr; 31776947451fSStefano Zampini 31786947451fSStefano Zampini PetscFunctionBegin; 31796947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 31806947451fSStefano Zampini PetscValidType(A,1); 31816947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 31826947451fSStefano Zampini PetscValidPointer(v,3); 31836947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 31846947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 31856947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseRestoreColumnVecRead_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 31866947451fSStefano Zampini PetscFunctionReturn(0); 31876947451fSStefano Zampini } 31886947451fSStefano Zampini 31896947451fSStefano Zampini /*@C 31906947451fSStefano Zampini MatDenseGetColumnVecWrite - Gives write-only access to a column of a dense matrix, represented as a Vec. 31916947451fSStefano Zampini 31926947451fSStefano Zampini Collective 31936947451fSStefano Zampini 31946947451fSStefano Zampini Input Parameter: 31956947451fSStefano Zampini + mat - the Mat object 31966947451fSStefano Zampini - col - the column index 31976947451fSStefano Zampini 31986947451fSStefano Zampini Output Parameter: 31996947451fSStefano Zampini . v - the vector 32006947451fSStefano Zampini 32016947451fSStefano Zampini Notes: 32026947451fSStefano Zampini The vector is owned by PETSc. Users need to call MatDenseRestoreColumnVecWrite() when the vector is no longer needed. 32036947451fSStefano Zampini Use MatDenseGetColumnVec() to obtain read-write access or MatDenseGetColumnVecRead() for read-only access. 32046947451fSStefano Zampini 32056947451fSStefano Zampini Level: intermediate 32066947451fSStefano Zampini 32076947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecRead(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecRead(), MatDenseRestoreColumnVecWrite() 32086947451fSStefano Zampini @*/ 32096947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVecWrite(Mat A,PetscInt col,Vec *v) 32106947451fSStefano Zampini { 32116947451fSStefano Zampini PetscErrorCode ierr; 32126947451fSStefano Zampini 32136947451fSStefano Zampini PetscFunctionBegin; 32146947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 32156947451fSStefano Zampini PetscValidType(A,1); 32166947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 32176947451fSStefano Zampini PetscValidPointer(v,3); 32186947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 32196947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 32206947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseGetColumnVecWrite_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 32216947451fSStefano Zampini PetscFunctionReturn(0); 32226947451fSStefano Zampini } 32236947451fSStefano Zampini 32246947451fSStefano Zampini /*@C 32256947451fSStefano Zampini MatDenseRestoreColumnVecWrite - Returns access to a column of a dense matrix obtained from MatDenseGetColumnVecWrite(). 32266947451fSStefano Zampini 32276947451fSStefano Zampini Collective 32286947451fSStefano Zampini 32296947451fSStefano Zampini Input Parameter: 32306947451fSStefano Zampini + mat - the Mat object 32316947451fSStefano Zampini . col - the column index 32326947451fSStefano Zampini - v - the Vec object 32336947451fSStefano Zampini 32346947451fSStefano Zampini Level: intermediate 32356947451fSStefano Zampini 32366947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecRead(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecRead() 32376947451fSStefano Zampini @*/ 32386947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVecWrite(Mat A,PetscInt col,Vec *v) 32396947451fSStefano Zampini { 32406947451fSStefano Zampini PetscErrorCode ierr; 32416947451fSStefano Zampini 32426947451fSStefano Zampini PetscFunctionBegin; 32436947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 32446947451fSStefano Zampini PetscValidType(A,1); 32456947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 32466947451fSStefano Zampini PetscValidPointer(v,3); 32476947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 32486947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 32496947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseRestoreColumnVecWrite_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 32506947451fSStefano Zampini PetscFunctionReturn(0); 32516947451fSStefano Zampini } 3252