1be1d678aSKris Buschelman 267e560aaSBarry Smith /* 367e560aaSBarry Smith Defines the basic matrix operations for sequential dense. 467e560aaSBarry Smith */ 5289bc588SBarry Smith 6dec5eb66SMatthew G Knepley #include <../src/mat/impls/dense/seq/dense.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8289bc588SBarry Smith 96a63e612SBarry Smith #include <../src/mat/impls/aij/seq/aij.h> 10b2573a8aSBarry Smith 11ca15aa20SStefano Zampini PetscErrorCode MatSeqDenseSymmetrize_Private(Mat A, PetscBool hermitian) 128c178816SStefano Zampini { 138c178816SStefano Zampini Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 148c178816SStefano Zampini PetscInt j, k, n = A->rmap->n; 15ca15aa20SStefano Zampini PetscScalar *v; 16ca15aa20SStefano Zampini PetscErrorCode ierr; 178c178816SStefano Zampini 188c178816SStefano Zampini PetscFunctionBegin; 198c178816SStefano Zampini if (A->rmap->n != A->cmap->n) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot symmetrize a rectangular matrix"); 20ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 218c178816SStefano Zampini if (!hermitian) { 228c178816SStefano Zampini for (k=0;k<n;k++) { 238c178816SStefano Zampini for (j=k;j<n;j++) { 24ca15aa20SStefano Zampini v[j*mat->lda + k] = v[k*mat->lda + j]; 258c178816SStefano Zampini } 268c178816SStefano Zampini } 278c178816SStefano Zampini } else { 288c178816SStefano Zampini for (k=0;k<n;k++) { 298c178816SStefano Zampini for (j=k;j<n;j++) { 30ca15aa20SStefano Zampini v[j*mat->lda + k] = PetscConj(v[k*mat->lda + j]); 318c178816SStefano Zampini } 328c178816SStefano Zampini } 338c178816SStefano Zampini } 34ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 358c178816SStefano Zampini PetscFunctionReturn(0); 368c178816SStefano Zampini } 378c178816SStefano Zampini 3805709791SSatish Balay PETSC_EXTERN PetscErrorCode MatSeqDenseInvertFactors_Private(Mat A) 398c178816SStefano Zampini { 408c178816SStefano Zampini Mat_SeqDense *mat = 
(Mat_SeqDense*)A->data; 418c178816SStefano Zampini PetscErrorCode ierr; 428c178816SStefano Zampini PetscBLASInt info,n; 438c178816SStefano Zampini 448c178816SStefano Zampini PetscFunctionBegin; 458c178816SStefano Zampini if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 468c178816SStefano Zampini ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 478c178816SStefano Zampini if (A->factortype == MAT_FACTOR_LU) { 488c178816SStefano Zampini if (!mat->pivots) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Pivots not present"); 498c178816SStefano Zampini if (!mat->fwork) { 508c178816SStefano Zampini mat->lfwork = n; 518c178816SStefano Zampini ierr = PetscMalloc1(mat->lfwork,&mat->fwork);CHKERRQ(ierr); 528c178816SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,mat->lfwork*sizeof(PetscBLASInt));CHKERRQ(ierr); 538c178816SStefano Zampini } 5400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 558c178816SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&mat->lfwork,&info)); 5600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 57ca15aa20SStefano Zampini ierr = PetscLogFlops((1.0*A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 588c178816SStefano Zampini } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 598c178816SStefano Zampini if (A->spd) { 6000121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 618c178816SStefano Zampini PetscStackCallBLAS("LAPACKpotri",LAPACKpotri_("L",&n,mat->v,&mat->lda,&info)); 6200121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 638c178816SStefano Zampini ierr = MatSeqDenseSymmetrize_Private(A,PETSC_TRUE);CHKERRQ(ierr); 648c178816SStefano Zampini #if defined(PETSC_USE_COMPLEX) 658c178816SStefano Zampini } else if (A->hermitian) { 668c178816SStefano Zampini if (!mat->pivots) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Pivots not present"); 678c178816SStefano Zampini if (!mat->fwork) 
SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Fwork not present"); 6800121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 698c178816SStefano Zampini PetscStackCallBLAS("LAPACKhetri",LAPACKhetri_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&info)); 7000121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 718c178816SStefano Zampini ierr = MatSeqDenseSymmetrize_Private(A,PETSC_TRUE);CHKERRQ(ierr); 728c178816SStefano Zampini #endif 738c178816SStefano Zampini } else { /* symmetric case */ 748c178816SStefano Zampini if (!mat->pivots) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Pivots not present"); 758c178816SStefano Zampini if (!mat->fwork) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Fwork not present"); 7600121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 778c178816SStefano Zampini PetscStackCallBLAS("LAPACKsytri",LAPACKsytri_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&info)); 7800121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 798c178816SStefano Zampini ierr = MatSeqDenseSymmetrize_Private(A,PETSC_FALSE);CHKERRQ(ierr); 808c178816SStefano Zampini } 818c178816SStefano Zampini if (info) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_CH_ZRPVT,"Bad Inversion: zero pivot in row %D",(PetscInt)info-1); 82ca15aa20SStefano Zampini ierr = PetscLogFlops((1.0*A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 838c178816SStefano Zampini } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 848c178816SStefano Zampini 858c178816SStefano Zampini A->ops->solve = NULL; 868c178816SStefano Zampini A->ops->matsolve = NULL; 878c178816SStefano Zampini A->ops->solvetranspose = NULL; 888c178816SStefano Zampini A->ops->matsolvetranspose = NULL; 898c178816SStefano Zampini A->ops->solveadd = NULL; 908c178816SStefano Zampini A->ops->solvetransposeadd = NULL; 918c178816SStefano Zampini A->factortype = MAT_FACTOR_NONE; 928c178816SStefano Zampini ierr = 
PetscFree(A->solvertype);CHKERRQ(ierr); 938c178816SStefano Zampini PetscFunctionReturn(0); 948c178816SStefano Zampini } 958c178816SStefano Zampini 963f49a652SStefano Zampini PetscErrorCode MatZeroRowsColumns_SeqDense(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 973f49a652SStefano Zampini { 983f49a652SStefano Zampini PetscErrorCode ierr; 993f49a652SStefano Zampini Mat_SeqDense *l = (Mat_SeqDense*)A->data; 1003f49a652SStefano Zampini PetscInt m = l->lda, n = A->cmap->n,r = A->rmap->n, i,j; 101ca15aa20SStefano Zampini PetscScalar *slot,*bb,*v; 1023f49a652SStefano Zampini const PetscScalar *xx; 1033f49a652SStefano Zampini 1043f49a652SStefano Zampini PetscFunctionBegin; 10576bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 1063f49a652SStefano Zampini for (i=0; i<N; i++) { 1073f49a652SStefano Zampini if (rows[i] < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row requested to be zeroed"); 1083f49a652SStefano Zampini if (rows[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested to be zeroed greater than or equal number of rows %D",rows[i],A->rmap->n); 1093f49a652SStefano Zampini if (rows[i] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Col %D requested to be zeroed greater than or equal number of cols %D",rows[i],A->cmap->n); 1103f49a652SStefano Zampini } 11176bd3646SJed Brown } 112ca15aa20SStefano Zampini if (!N) PetscFunctionReturn(0); 1133f49a652SStefano Zampini 1143f49a652SStefano Zampini /* fix right hand side if needed */ 1153f49a652SStefano Zampini if (x && b) { 1166c4d906cSStefano Zampini Vec xt; 1176c4d906cSStefano Zampini 1186c4d906cSStefano Zampini if (A->rmap->n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only coded for square matrices"); 1196c4d906cSStefano Zampini ierr = VecDuplicate(x,&xt);CHKERRQ(ierr); 1206c4d906cSStefano Zampini ierr = VecCopy(x,xt);CHKERRQ(ierr); 1216c4d906cSStefano Zampini ierr = VecScale(xt,-1.0);CHKERRQ(ierr); 1226c4d906cSStefano 
Zampini ierr = MatMultAdd(A,xt,b,b);CHKERRQ(ierr); 1236c4d906cSStefano Zampini ierr = VecDestroy(&xt);CHKERRQ(ierr); 1243f49a652SStefano Zampini ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 1253f49a652SStefano Zampini ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 1263f49a652SStefano Zampini for (i=0; i<N; i++) bb[rows[i]] = diag*xx[rows[i]]; 1273f49a652SStefano Zampini ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 1283f49a652SStefano Zampini ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 1293f49a652SStefano Zampini } 1303f49a652SStefano Zampini 131ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 1323f49a652SStefano Zampini for (i=0; i<N; i++) { 133ca15aa20SStefano Zampini slot = v + rows[i]*m; 134580bdb30SBarry Smith ierr = PetscArrayzero(slot,r);CHKERRQ(ierr); 1353f49a652SStefano Zampini } 1363f49a652SStefano Zampini for (i=0; i<N; i++) { 137ca15aa20SStefano Zampini slot = v + rows[i]; 1383f49a652SStefano Zampini for (j=0; j<n; j++) { *slot = 0.0; slot += m;} 1393f49a652SStefano Zampini } 1403f49a652SStefano Zampini if (diag != 0.0) { 1413f49a652SStefano Zampini if (A->rmap->n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only coded for square matrices"); 1423f49a652SStefano Zampini for (i=0; i<N; i++) { 143ca15aa20SStefano Zampini slot = v + (m+1)*rows[i]; 1443f49a652SStefano Zampini *slot = diag; 1453f49a652SStefano Zampini } 1463f49a652SStefano Zampini } 147ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 1483f49a652SStefano Zampini PetscFunctionReturn(0); 1493f49a652SStefano Zampini } 1503f49a652SStefano Zampini 151abc3b08eSStefano Zampini PetscErrorCode MatPtAPNumeric_SeqDense_SeqDense(Mat A,Mat P,Mat C) 152abc3b08eSStefano Zampini { 153abc3b08eSStefano Zampini Mat_SeqDense *c = (Mat_SeqDense*)(C->data); 154abc3b08eSStefano Zampini PetscErrorCode ierr; 155abc3b08eSStefano Zampini 156abc3b08eSStefano Zampini PetscFunctionBegin; 157ca15aa20SStefano Zampini if (c->ptapwork) { 158ca15aa20SStefano Zampini ierr = 
(*C->ops->matmultnumeric)(A,P,c->ptapwork);CHKERRQ(ierr); 159ca15aa20SStefano Zampini ierr = (*C->ops->transposematmultnumeric)(P,c->ptapwork,C);CHKERRQ(ierr); 1604222ddf1SHong Zhang } else SETERRQ(PetscObjectComm((PetscObject)C),PETSC_ERR_SUP,"Must call MatPtAPSymbolic_SeqDense_SeqDense() first"); 161abc3b08eSStefano Zampini PetscFunctionReturn(0); 162abc3b08eSStefano Zampini } 163abc3b08eSStefano Zampini 1644222ddf1SHong Zhang PetscErrorCode MatPtAPSymbolic_SeqDense_SeqDense(Mat A,Mat P,PetscReal fill,Mat C) 165abc3b08eSStefano Zampini { 166abc3b08eSStefano Zampini Mat_SeqDense *c; 1677a3c3d58SStefano Zampini PetscBool cisdense; 168abc3b08eSStefano Zampini PetscErrorCode ierr; 169abc3b08eSStefano Zampini 170abc3b08eSStefano Zampini PetscFunctionBegin; 1714222ddf1SHong Zhang ierr = MatSetSizes(C,P->cmap->n,P->cmap->n,P->cmap->N,P->cmap->N);CHKERRQ(ierr); 1727a3c3d58SStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 1737a3c3d58SStefano Zampini if (!cisdense) { 1747a3c3d58SStefano Zampini PetscBool flg; 1757a3c3d58SStefano Zampini 1767a3c3d58SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)P,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 1774222ddf1SHong Zhang ierr = MatSetType(C,flg ? 
((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 1787a3c3d58SStefano Zampini } 1797a3c3d58SStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 1804222ddf1SHong Zhang c = (Mat_SeqDense*)C->data; 181ca15aa20SStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)A),&c->ptapwork);CHKERRQ(ierr); 182ca15aa20SStefano Zampini ierr = MatSetSizes(c->ptapwork,A->rmap->n,P->cmap->n,A->rmap->N,P->cmap->N);CHKERRQ(ierr); 1837a3c3d58SStefano Zampini ierr = MatSetType(c->ptapwork,((PetscObject)C)->type_name);CHKERRQ(ierr); 1847a3c3d58SStefano Zampini ierr = MatSetUp(c->ptapwork);CHKERRQ(ierr); 185abc3b08eSStefano Zampini PetscFunctionReturn(0); 186abc3b08eSStefano Zampini } 187abc3b08eSStefano Zampini 188cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqDense(Mat A,MatType newtype,MatReuse reuse,Mat *newmat) 189b49cda9fSStefano Zampini { 190a13144ffSStefano Zampini Mat B = NULL; 191b49cda9fSStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 192b49cda9fSStefano Zampini Mat_SeqDense *b; 193b49cda9fSStefano Zampini PetscErrorCode ierr; 194b49cda9fSStefano Zampini PetscInt *ai=a->i,*aj=a->j,m=A->rmap->N,n=A->cmap->N,i; 195b49cda9fSStefano Zampini MatScalar *av=a->a; 196a13144ffSStefano Zampini PetscBool isseqdense; 197b49cda9fSStefano Zampini 198b49cda9fSStefano Zampini PetscFunctionBegin; 199a13144ffSStefano Zampini if (reuse == MAT_REUSE_MATRIX) { 200a13144ffSStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)*newmat,MATSEQDENSE,&isseqdense);CHKERRQ(ierr); 201a32993e3SJed Brown if (!isseqdense) SETERRQ1(PetscObjectComm((PetscObject)*newmat),PETSC_ERR_USER,"Cannot reuse matrix of type %s",((PetscObject)(*newmat))->type_name); 202a13144ffSStefano Zampini } 203a13144ffSStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 204b49cda9fSStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 205b49cda9fSStefano Zampini ierr = MatSetSizes(B,m,n,m,n);CHKERRQ(ierr); 206b49cda9fSStefano Zampini ierr = 
MatSetType(B,MATSEQDENSE);CHKERRQ(ierr); 207b49cda9fSStefano Zampini ierr = MatSeqDenseSetPreallocation(B,NULL);CHKERRQ(ierr); 208b49cda9fSStefano Zampini b = (Mat_SeqDense*)(B->data); 209a13144ffSStefano Zampini } else { 210a13144ffSStefano Zampini b = (Mat_SeqDense*)((*newmat)->data); 211580bdb30SBarry Smith ierr = PetscArrayzero(b->v,m*n);CHKERRQ(ierr); 212a13144ffSStefano Zampini } 213b49cda9fSStefano Zampini for (i=0; i<m; i++) { 214b49cda9fSStefano Zampini PetscInt j; 215b49cda9fSStefano Zampini for (j=0;j<ai[1]-ai[0];j++) { 216b49cda9fSStefano Zampini b->v[*aj*m+i] = *av; 217b49cda9fSStefano Zampini aj++; 218b49cda9fSStefano Zampini av++; 219b49cda9fSStefano Zampini } 220b49cda9fSStefano Zampini ai++; 221b49cda9fSStefano Zampini } 222b49cda9fSStefano Zampini 223511c6705SHong Zhang if (reuse == MAT_INPLACE_MATRIX) { 224a13144ffSStefano Zampini ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 225a13144ffSStefano Zampini ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 22628be2f97SBarry Smith ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr); 227b49cda9fSStefano Zampini } else { 228a13144ffSStefano Zampini if (B) *newmat = B; 229a13144ffSStefano Zampini ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 230a13144ffSStefano Zampini ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 231b49cda9fSStefano Zampini } 232b49cda9fSStefano Zampini PetscFunctionReturn(0); 233b49cda9fSStefano Zampini } 234b49cda9fSStefano Zampini 235cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqDense_SeqAIJ(Mat A, MatType newtype,MatReuse reuse,Mat *newmat) 2366a63e612SBarry Smith { 2376a63e612SBarry Smith Mat B; 2386a63e612SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2396a63e612SBarry Smith PetscErrorCode ierr; 2409399e1b8SMatthew G. Knepley PetscInt i, j; 2419399e1b8SMatthew G. Knepley PetscInt *rows, *nnz; 2429399e1b8SMatthew G. 
Knepley MatScalar *aa = a->v, *vals; 2436a63e612SBarry Smith 2446a63e612SBarry Smith PetscFunctionBegin; 245ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 2466a63e612SBarry Smith ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 2476a63e612SBarry Smith ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 2489399e1b8SMatthew G. Knepley ierr = PetscCalloc3(A->rmap->n,&rows,A->rmap->n,&nnz,A->rmap->n,&vals);CHKERRQ(ierr); 2499399e1b8SMatthew G. Knepley for (j=0; j<A->cmap->n; j++) { 2509399e1b8SMatthew G. Knepley for (i=0; i<A->rmap->n; i++) if (aa[i] != 0.0 || i == j) ++nnz[i]; 2516a63e612SBarry Smith aa += a->lda; 2526a63e612SBarry Smith } 2539399e1b8SMatthew G. Knepley ierr = MatSeqAIJSetPreallocation(B,PETSC_DETERMINE,nnz);CHKERRQ(ierr); 2549399e1b8SMatthew G. Knepley aa = a->v; 2559399e1b8SMatthew G. Knepley for (j=0; j<A->cmap->n; j++) { 2569399e1b8SMatthew G. Knepley PetscInt numRows = 0; 2579399e1b8SMatthew G. Knepley for (i=0; i<A->rmap->n; i++) if (aa[i] != 0.0 || i == j) {rows[numRows] = i; vals[numRows++] = aa[i];} 2589399e1b8SMatthew G. Knepley ierr = MatSetValues(B,numRows,rows,1,&j,vals,INSERT_VALUES);CHKERRQ(ierr); 2599399e1b8SMatthew G. Knepley aa += a->lda; 2609399e1b8SMatthew G. Knepley } 2619399e1b8SMatthew G. 
Knepley ierr = PetscFree3(rows,nnz,vals);CHKERRQ(ierr); 2626a63e612SBarry Smith ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2636a63e612SBarry Smith ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2646a63e612SBarry Smith 265511c6705SHong Zhang if (reuse == MAT_INPLACE_MATRIX) { 26628be2f97SBarry Smith ierr = MatHeaderReplace(A,&B);CHKERRQ(ierr); 2676a63e612SBarry Smith } else { 2686a63e612SBarry Smith *newmat = B; 2696a63e612SBarry Smith } 2706a63e612SBarry Smith PetscFunctionReturn(0); 2716a63e612SBarry Smith } 2726a63e612SBarry Smith 273ca15aa20SStefano Zampini PetscErrorCode MatAXPY_SeqDense(Mat Y,PetscScalar alpha,Mat X,MatStructure str) 2741987afe7SBarry Smith { 2751987afe7SBarry Smith Mat_SeqDense *x = (Mat_SeqDense*)X->data,*y = (Mat_SeqDense*)Y->data; 276ca15aa20SStefano Zampini const PetscScalar *xv; 277ca15aa20SStefano Zampini PetscScalar *yv; 2780805154bSBarry Smith PetscBLASInt N,m,ldax,lday,one = 1; 279efee365bSSatish Balay PetscErrorCode ierr; 2803a40ed3dSBarry Smith 2813a40ed3dSBarry Smith PetscFunctionBegin; 282ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(X,&xv);CHKERRQ(ierr); 283ca15aa20SStefano Zampini ierr = MatDenseGetArray(Y,&yv);CHKERRQ(ierr); 284c5df96a5SBarry Smith ierr = PetscBLASIntCast(X->rmap->n*X->cmap->n,&N);CHKERRQ(ierr); 285c5df96a5SBarry Smith ierr = PetscBLASIntCast(X->rmap->n,&m);CHKERRQ(ierr); 286c5df96a5SBarry Smith ierr = PetscBLASIntCast(x->lda,&ldax);CHKERRQ(ierr); 287c5df96a5SBarry Smith ierr = PetscBLASIntCast(y->lda,&lday);CHKERRQ(ierr); 288a5ce6ee0Svictorle if (ldax>m || lday>m) { 289ca15aa20SStefano Zampini PetscInt j; 290ca15aa20SStefano Zampini 291d0f46423SBarry Smith for (j=0; j<X->cmap->n; j++) { 292ca15aa20SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&m,&alpha,xv+j*ldax,&one,yv+j*lday,&one)); 293a5ce6ee0Svictorle } 294a5ce6ee0Svictorle } else { 295ca15aa20SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&N,&alpha,xv,&one,yv,&one)); 296a5ce6ee0Svictorle } 
297ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(X,&xv);CHKERRQ(ierr); 298ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(Y,&yv);CHKERRQ(ierr); 2990450473dSBarry Smith ierr = PetscLogFlops(PetscMax(2*N-1,0));CHKERRQ(ierr); 3003a40ed3dSBarry Smith PetscFunctionReturn(0); 3011987afe7SBarry Smith } 3021987afe7SBarry Smith 303e0877f53SBarry Smith static PetscErrorCode MatGetInfo_SeqDense(Mat A,MatInfoType flag,MatInfo *info) 304289bc588SBarry Smith { 305ca15aa20SStefano Zampini PetscLogDouble N = A->rmap->n*A->cmap->n; 3063a40ed3dSBarry Smith 3073a40ed3dSBarry Smith PetscFunctionBegin; 3084e220ebcSLois Curfman McInnes info->block_size = 1.0; 309ca15aa20SStefano Zampini info->nz_allocated = N; 310ca15aa20SStefano Zampini info->nz_used = N; 311ca15aa20SStefano Zampini info->nz_unneeded = 0; 312ca15aa20SStefano Zampini info->assemblies = A->num_ass; 3134e220ebcSLois Curfman McInnes info->mallocs = 0; 3147adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 3154e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 3164e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 3174e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 3183a40ed3dSBarry Smith PetscFunctionReturn(0); 319289bc588SBarry Smith } 320289bc588SBarry Smith 321637a0070SStefano Zampini PetscErrorCode MatScale_SeqDense(Mat A,PetscScalar alpha) 32280cd9d93SLois Curfman McInnes { 323273d9f13SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 324ca15aa20SStefano Zampini PetscScalar *v; 325efee365bSSatish Balay PetscErrorCode ierr; 326c5df96a5SBarry Smith PetscBLASInt one = 1,j,nz,lda; 32780cd9d93SLois Curfman McInnes 3283a40ed3dSBarry Smith PetscFunctionBegin; 329ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 330c5df96a5SBarry Smith ierr = PetscBLASIntCast(a->lda,&lda);CHKERRQ(ierr); 331d0f46423SBarry Smith if (lda>A->rmap->n) { 332c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&nz);CHKERRQ(ierr); 333d0f46423SBarry Smith for (j=0; j<A->cmap->n; 
j++) { 334ca15aa20SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&nz,&alpha,v+j*lda,&one)); 335a5ce6ee0Svictorle } 336a5ce6ee0Svictorle } else { 337c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n*A->cmap->n,&nz);CHKERRQ(ierr); 338ca15aa20SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&nz,&alpha,v,&one)); 339a5ce6ee0Svictorle } 340efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 341ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 3423a40ed3dSBarry Smith PetscFunctionReturn(0); 34380cd9d93SLois Curfman McInnes } 34480cd9d93SLois Curfman McInnes 345e0877f53SBarry Smith static PetscErrorCode MatIsHermitian_SeqDense(Mat A,PetscReal rtol,PetscBool *fl) 3461cbb95d3SBarry Smith { 3471cbb95d3SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 348ca15aa20SStefano Zampini PetscInt i,j,m = A->rmap->n,N = a->lda; 349ca15aa20SStefano Zampini const PetscScalar *v; 350ca15aa20SStefano Zampini PetscErrorCode ierr; 3511cbb95d3SBarry Smith 3521cbb95d3SBarry Smith PetscFunctionBegin; 3531cbb95d3SBarry Smith *fl = PETSC_FALSE; 354d0f46423SBarry Smith if (A->rmap->n != A->cmap->n) PetscFunctionReturn(0); 355ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 3561cbb95d3SBarry Smith for (i=0; i<m; i++) { 357ca15aa20SStefano Zampini for (j=i; j<m; j++) { 358637a0070SStefano Zampini if (PetscAbsScalar(v[i+j*N] - PetscConj(v[j+i*N])) > rtol) { 359637a0070SStefano Zampini goto restore; 3601cbb95d3SBarry Smith } 3611cbb95d3SBarry Smith } 362637a0070SStefano Zampini } 3631cbb95d3SBarry Smith *fl = PETSC_TRUE; 364637a0070SStefano Zampini restore: 365637a0070SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 366637a0070SStefano Zampini PetscFunctionReturn(0); 367637a0070SStefano Zampini } 368637a0070SStefano Zampini 369637a0070SStefano Zampini static PetscErrorCode MatIsSymmetric_SeqDense(Mat A,PetscReal rtol,PetscBool *fl) 370637a0070SStefano Zampini { 371637a0070SStefano Zampini 
Mat_SeqDense *a = (Mat_SeqDense*)A->data; 372637a0070SStefano Zampini PetscInt i,j,m = A->rmap->n,N = a->lda; 373637a0070SStefano Zampini const PetscScalar *v; 374637a0070SStefano Zampini PetscErrorCode ierr; 375637a0070SStefano Zampini 376637a0070SStefano Zampini PetscFunctionBegin; 377637a0070SStefano Zampini *fl = PETSC_FALSE; 378637a0070SStefano Zampini if (A->rmap->n != A->cmap->n) PetscFunctionReturn(0); 379637a0070SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 380637a0070SStefano Zampini for (i=0; i<m; i++) { 381637a0070SStefano Zampini for (j=i; j<m; j++) { 382637a0070SStefano Zampini if (PetscAbsScalar(v[i+j*N] - v[j+i*N]) > rtol) { 383637a0070SStefano Zampini goto restore; 384637a0070SStefano Zampini } 385637a0070SStefano Zampini } 386637a0070SStefano Zampini } 387637a0070SStefano Zampini *fl = PETSC_TRUE; 388637a0070SStefano Zampini restore: 389637a0070SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 3901cbb95d3SBarry Smith PetscFunctionReturn(0); 3911cbb95d3SBarry Smith } 3921cbb95d3SBarry Smith 393ca15aa20SStefano Zampini PetscErrorCode MatDuplicateNoCreate_SeqDense(Mat newi,Mat A,MatDuplicateOption cpvalues) 394b24902e0SBarry Smith { 395ca15aa20SStefano Zampini Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 396b24902e0SBarry Smith PetscErrorCode ierr; 397*23fc5dcaSStefano Zampini PetscInt lda = (PetscInt)mat->lda,j,m,nlda = lda; 398b24902e0SBarry Smith 399b24902e0SBarry Smith PetscFunctionBegin; 400aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->rmap,&newi->rmap);CHKERRQ(ierr); 401aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->cmap,&newi->cmap);CHKERRQ(ierr); 402*23fc5dcaSStefano Zampini if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { /* propagate LDA */ 403*23fc5dcaSStefano Zampini ierr = MatDenseSetLDA(newi,lda);CHKERRQ(ierr); 404*23fc5dcaSStefano Zampini } 4050298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(newi,NULL);CHKERRQ(ierr); 406b24902e0SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 
407ca15aa20SStefano Zampini const PetscScalar *av; 408ca15aa20SStefano Zampini PetscScalar *v; 409ca15aa20SStefano Zampini 410ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&av);CHKERRQ(ierr); 411ca15aa20SStefano Zampini ierr = MatDenseGetArray(newi,&v);CHKERRQ(ierr); 412*23fc5dcaSStefano Zampini ierr = MatDenseGetLDA(newi,&nlda);CHKERRQ(ierr); 413d0f46423SBarry Smith m = A->rmap->n; 414*23fc5dcaSStefano Zampini if (lda>m || nlda>m) { 415d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 416*23fc5dcaSStefano Zampini ierr = PetscArraycpy(v+j*nlda,av+j*lda,m);CHKERRQ(ierr); 417b24902e0SBarry Smith } 418b24902e0SBarry Smith } else { 419ca15aa20SStefano Zampini ierr = PetscArraycpy(v,av,A->rmap->n*A->cmap->n);CHKERRQ(ierr); 420b24902e0SBarry Smith } 421ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(newi,&v);CHKERRQ(ierr); 422ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&av);CHKERRQ(ierr); 423b24902e0SBarry Smith } 424b24902e0SBarry Smith PetscFunctionReturn(0); 425b24902e0SBarry Smith } 426b24902e0SBarry Smith 427ca15aa20SStefano Zampini PetscErrorCode MatDuplicate_SeqDense(Mat A,MatDuplicateOption cpvalues,Mat *newmat) 42802cad45dSBarry Smith { 4296849ba73SBarry Smith PetscErrorCode ierr; 43002cad45dSBarry Smith 4313a40ed3dSBarry Smith PetscFunctionBegin; 432ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),newmat);CHKERRQ(ierr); 433d0f46423SBarry Smith ierr = MatSetSizes(*newmat,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 4345c9eb25fSBarry Smith ierr = MatSetType(*newmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 435719d5645SBarry Smith ierr = MatDuplicateNoCreate_SeqDense(*newmat,A,cpvalues);CHKERRQ(ierr); 436b24902e0SBarry Smith PetscFunctionReturn(0); 437b24902e0SBarry Smith } 438b24902e0SBarry Smith 439e0877f53SBarry Smith static PetscErrorCode MatLUFactorNumeric_SeqDense(Mat fact,Mat A,const MatFactorInfo *info_dummy) 440289bc588SBarry Smith { 4414482741eSBarry Smith MatFactorInfo info; 
442a093e273SMatthew Knepley PetscErrorCode ierr; 4433a40ed3dSBarry Smith 4443a40ed3dSBarry Smith PetscFunctionBegin; 445c3ef05f6SHong Zhang ierr = MatDuplicateNoCreate_SeqDense(fact,A,MAT_COPY_VALUES);CHKERRQ(ierr); 446ca15aa20SStefano Zampini ierr = (*fact->ops->lufactor)(fact,0,0,&info);CHKERRQ(ierr); 4473a40ed3dSBarry Smith PetscFunctionReturn(0); 448289bc588SBarry Smith } 4496ee01492SSatish Balay 450e0877f53SBarry Smith static PetscErrorCode MatSolve_SeqDense(Mat A,Vec xx,Vec yy) 451289bc588SBarry Smith { 452c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 4536849ba73SBarry Smith PetscErrorCode ierr; 454f1ceaac6SMatthew G. Knepley const PetscScalar *x; 455f1ceaac6SMatthew G. Knepley PetscScalar *y; 456c5df96a5SBarry Smith PetscBLASInt one = 1,info,m; 45767e560aaSBarry Smith 4583a40ed3dSBarry Smith PetscFunctionBegin; 459c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 460f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 4611ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 462580bdb30SBarry Smith ierr = PetscArraycpy(y,x,A->rmap->n);CHKERRQ(ierr); 463d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_LU) { 46400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 4658b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_("N",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 46600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 467e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"GETRS - Bad solve"); 468d5f3da31SBarry Smith } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 469a49dc2a2SStefano Zampini if (A->spd) { 47000121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 4718b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info)); 47200121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 473e32f2f54SBarry Smith if (info) 
SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 474a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 475a49dc2a2SStefano Zampini } else if (A->hermitian) { 47600121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 477a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrs",LAPACKhetrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 47800121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 479a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"HETRS Bad solve"); 480a49dc2a2SStefano Zampini #endif 481a49dc2a2SStefano Zampini } else { /* symmetric case */ 48200121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 483a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 48400121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 485a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"SYTRS Bad solve"); 486a49dc2a2SStefano Zampini } 4872205254eSKarl Rupp } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 488f1ceaac6SMatthew G. 
Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 4891ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 490dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 4913a40ed3dSBarry Smith PetscFunctionReturn(0); 492289bc588SBarry Smith } 4936ee01492SSatish Balay 494e0877f53SBarry Smith static PetscErrorCode MatMatSolve_SeqDense(Mat A,Mat B,Mat X) 49585e2c93fSHong Zhang { 49685e2c93fSHong Zhang Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 49785e2c93fSHong Zhang PetscErrorCode ierr; 4981683a169SBarry Smith const PetscScalar *b; 4991683a169SBarry Smith PetscScalar *x; 500efb80c78SLisandro Dalcin PetscInt n; 501783b601eSJed Brown PetscBLASInt nrhs,info,m; 50285e2c93fSHong Zhang 50385e2c93fSHong Zhang PetscFunctionBegin; 504c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 5050298fd71SBarry Smith ierr = MatGetSize(B,NULL,&n);CHKERRQ(ierr); 506c5df96a5SBarry Smith ierr = PetscBLASIntCast(n,&nrhs);CHKERRQ(ierr); 5071683a169SBarry Smith ierr = MatDenseGetArrayRead(B,&b);CHKERRQ(ierr); 5088c778c55SBarry Smith ierr = MatDenseGetArray(X,&x);CHKERRQ(ierr); 50985e2c93fSHong Zhang 510580bdb30SBarry Smith ierr = PetscArraycpy(x,b,m*nrhs);CHKERRQ(ierr); 51185e2c93fSHong Zhang 51285e2c93fSHong Zhang if (A->factortype == MAT_FACTOR_LU) { 51300121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5148b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_("N",&m,&nrhs,mat->v,&mat->lda,mat->pivots,x,&m,&info)); 51500121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 51685e2c93fSHong Zhang if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"GETRS - Bad solve"); 51785e2c93fSHong Zhang } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 518a49dc2a2SStefano Zampini if (A->spd) { 51900121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5208b83055fSJed Brown 
PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_("L",&m,&nrhs,mat->v,&mat->lda,x,&m,&info)); 52100121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 52285e2c93fSHong Zhang if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 523a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 524a49dc2a2SStefano Zampini } else if (A->hermitian) { 52500121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 526a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrs",LAPACKhetrs_("L",&m,&nrhs,mat->v,&mat->lda,mat->pivots,x,&m,&info)); 52700121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 528a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"HETRS Bad solve"); 529a49dc2a2SStefano Zampini #endif 530a49dc2a2SStefano Zampini } else { /* symmetric case */ 53100121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 532a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_("L",&m,&nrhs,mat->v,&mat->lda,mat->pivots,x,&m,&info)); 53300121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 534a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"SYTRS Bad solve"); 535a49dc2a2SStefano Zampini } 5362205254eSKarl Rupp } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 53785e2c93fSHong Zhang 5381683a169SBarry Smith ierr = MatDenseRestoreArrayRead(B,&b);CHKERRQ(ierr); 5398c778c55SBarry Smith ierr = MatDenseRestoreArray(X,&x);CHKERRQ(ierr); 54085e2c93fSHong Zhang ierr = PetscLogFlops(nrhs*(2.0*m*m - m));CHKERRQ(ierr); 54185e2c93fSHong Zhang PetscFunctionReturn(0); 54285e2c93fSHong Zhang } 54385e2c93fSHong Zhang 54400121966SStefano Zampini static PetscErrorCode MatConjugate_SeqDense(Mat); 54500121966SStefano Zampini 546e0877f53SBarry Smith static PetscErrorCode MatSolveTranspose_SeqDense(Mat A,Vec xx,Vec yy) 547da3a660dSBarry Smith { 548c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = 
(Mat_SeqDense*)A->data; 549dfbe8321SBarry Smith PetscErrorCode ierr; 550f1ceaac6SMatthew G. Knepley const PetscScalar *x; 551f1ceaac6SMatthew G. Knepley PetscScalar *y; 552c5df96a5SBarry Smith PetscBLASInt one = 1,info,m; 55367e560aaSBarry Smith 5543a40ed3dSBarry Smith PetscFunctionBegin; 555c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 556f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 5571ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 558580bdb30SBarry Smith ierr = PetscArraycpy(y,x,A->rmap->n);CHKERRQ(ierr); 5598208b9aeSStefano Zampini if (A->factortype == MAT_FACTOR_LU) { 56000121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5618b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_("T",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 56200121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 563e32f2f54SBarry Smith if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS - Bad solve"); 5648208b9aeSStefano Zampini } else if (A->factortype == MAT_FACTOR_CHOLESKY) { 565a49dc2a2SStefano Zampini if (A->spd) { 56600121966SStefano Zampini #if defined(PETSC_USE_COMPLEX) 56700121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 56800121966SStefano Zampini #endif 56900121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 5708b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_("L",&m,&one,mat->v,&mat->lda,y,&m,&info)); 57100121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 57200121966SStefano Zampini #if defined(PETSC_USE_COMPLEX) 57300121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 57400121966SStefano Zampini #endif 575a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"POTRS Bad solve"); 576a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 577a49dc2a2SStefano Zampini } else if (A->hermitian) { 57800121966SStefano Zampini ierr = 
MatConjugate_SeqDense(A);CHKERRQ(ierr); 57900121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 58000121966SStefano Zampini PetscStackCallBLAS("LAPACKhetrs",LAPACKhetrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 58100121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 58200121966SStefano Zampini ierr = MatConjugate_SeqDense(A);CHKERRQ(ierr); 583ae7cfcebSSatish Balay #endif 584a49dc2a2SStefano Zampini } else { /* symmetric case */ 58500121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 586a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_("L",&m,&one,mat->v,&mat->lda,mat->pivots,y,&m,&info)); 58700121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 588a49dc2a2SStefano Zampini if (info) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"SYTRS Bad solve"); 589da3a660dSBarry Smith } 590a49dc2a2SStefano Zampini } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix must be factored to solve"); 591f1ceaac6SMatthew G. 
Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 5921ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 593dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 5943a40ed3dSBarry Smith PetscFunctionReturn(0); 595da3a660dSBarry Smith } 5966ee01492SSatish Balay 597db4efbfdSBarry Smith /* ---------------------------------------------------------------*/ 598db4efbfdSBarry Smith /* COMMENT: I have chosen to hide row permutation in the pivots, 599db4efbfdSBarry Smith rather than put it in the Mat->row slot.*/ 600ca15aa20SStefano Zampini PetscErrorCode MatLUFactor_SeqDense(Mat A,IS row,IS col,const MatFactorInfo *minfo) 601db4efbfdSBarry Smith { 602db4efbfdSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 603db4efbfdSBarry Smith PetscErrorCode ierr; 604db4efbfdSBarry Smith PetscBLASInt n,m,info; 605db4efbfdSBarry Smith 606db4efbfdSBarry Smith PetscFunctionBegin; 607c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 608c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 609db4efbfdSBarry Smith if (!mat->pivots) { 6108208b9aeSStefano Zampini ierr = PetscMalloc1(A->rmap->n,&mat->pivots);CHKERRQ(ierr); 6113bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 612db4efbfdSBarry Smith } 613db4efbfdSBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 6148e57ea43SSatish Balay ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 6158b83055fSJed Brown PetscStackCallBLAS("LAPACKgetrf",LAPACKgetrf_(&m,&n,mat->v,&mat->lda,mat->pivots,&info)); 6168e57ea43SSatish Balay ierr = PetscFPTrapPop();CHKERRQ(ierr); 6178e57ea43SSatish Balay 618e32f2f54SBarry Smith if (info<0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Bad argument to LU factorization"); 619e32f2f54SBarry Smith if (info>0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Bad LU factorization"); 6208208b9aeSStefano Zampini 621db4efbfdSBarry 
Smith A->ops->solve = MatSolve_SeqDense; 6228208b9aeSStefano Zampini A->ops->matsolve = MatMatSolve_SeqDense; 623db4efbfdSBarry Smith A->ops->solvetranspose = MatSolveTranspose_SeqDense; 624d5f3da31SBarry Smith A->factortype = MAT_FACTOR_LU; 625db4efbfdSBarry Smith 626f6224b95SHong Zhang ierr = PetscFree(A->solvertype);CHKERRQ(ierr); 627f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&A->solvertype);CHKERRQ(ierr); 628f6224b95SHong Zhang 629dc0b31edSSatish Balay ierr = PetscLogFlops((2.0*A->cmap->n*A->cmap->n*A->cmap->n)/3);CHKERRQ(ierr); 630db4efbfdSBarry Smith PetscFunctionReturn(0); 631db4efbfdSBarry Smith } 632db4efbfdSBarry Smith 633a49dc2a2SStefano Zampini /* Cholesky as L*L^T or L*D*L^T and the symmetric/hermitian complex variants */ 634ca15aa20SStefano Zampini PetscErrorCode MatCholeskyFactor_SeqDense(Mat A,IS perm,const MatFactorInfo *factinfo) 635db4efbfdSBarry Smith { 636db4efbfdSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 637db4efbfdSBarry Smith PetscErrorCode ierr; 638c5df96a5SBarry Smith PetscBLASInt info,n; 639db4efbfdSBarry Smith 640db4efbfdSBarry Smith PetscFunctionBegin; 641c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 642db4efbfdSBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 643a49dc2a2SStefano Zampini if (A->spd) { 64400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 6458b83055fSJed Brown PetscStackCallBLAS("LAPACKpotrf",LAPACKpotrf_("L",&n,mat->v,&mat->lda,&info)); 64600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 647a49dc2a2SStefano Zampini #if defined(PETSC_USE_COMPLEX) 648a49dc2a2SStefano Zampini } else if (A->hermitian) { 649a49dc2a2SStefano Zampini if (!mat->pivots) { 650a49dc2a2SStefano Zampini ierr = PetscMalloc1(A->rmap->n,&mat->pivots);CHKERRQ(ierr); 651a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 652a49dc2a2SStefano Zampini } 653a49dc2a2SStefano 
Zampini if (!mat->fwork) { 654a49dc2a2SStefano Zampini PetscScalar dummy; 655a49dc2a2SStefano Zampini 656a49dc2a2SStefano Zampini mat->lfwork = -1; 65700121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 658a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrf",LAPACKhetrf_("L",&n,mat->v,&mat->lda,mat->pivots,&dummy,&mat->lfwork,&info)); 65900121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 660a49dc2a2SStefano Zampini mat->lfwork = (PetscInt)PetscRealPart(dummy); 661a49dc2a2SStefano Zampini ierr = PetscMalloc1(mat->lfwork,&mat->fwork);CHKERRQ(ierr); 662a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,mat->lfwork*sizeof(PetscBLASInt));CHKERRQ(ierr); 663a49dc2a2SStefano Zampini } 66400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 665a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKhetrf",LAPACKhetrf_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&mat->lfwork,&info)); 66600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 667a49dc2a2SStefano Zampini #endif 668a49dc2a2SStefano Zampini } else { /* symmetric case */ 669a49dc2a2SStefano Zampini if (!mat->pivots) { 670a49dc2a2SStefano Zampini ierr = PetscMalloc1(A->rmap->n,&mat->pivots);CHKERRQ(ierr); 671a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscBLASInt));CHKERRQ(ierr); 672a49dc2a2SStefano Zampini } 673a49dc2a2SStefano Zampini if (!mat->fwork) { 674a49dc2a2SStefano Zampini PetscScalar dummy; 675a49dc2a2SStefano Zampini 676a49dc2a2SStefano Zampini mat->lfwork = -1; 67700121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 678a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_("L",&n,mat->v,&mat->lda,mat->pivots,&dummy,&mat->lfwork,&info)); 67900121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 680a49dc2a2SStefano Zampini mat->lfwork = (PetscInt)PetscRealPart(dummy); 681a49dc2a2SStefano Zampini ierr = 
PetscMalloc1(mat->lfwork,&mat->fwork);CHKERRQ(ierr); 682a49dc2a2SStefano Zampini ierr = PetscLogObjectMemory((PetscObject)A,mat->lfwork*sizeof(PetscBLASInt));CHKERRQ(ierr); 683a49dc2a2SStefano Zampini } 68400121966SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 685a49dc2a2SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_("L",&n,mat->v,&mat->lda,mat->pivots,mat->fwork,&mat->lfwork,&info)); 68600121966SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 687a49dc2a2SStefano Zampini } 688e32f2f54SBarry Smith if (info) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_CH_ZRPVT,"Bad factorization: zero pivot in row %D",(PetscInt)info-1); 6898208b9aeSStefano Zampini 690db4efbfdSBarry Smith A->ops->solve = MatSolve_SeqDense; 6918208b9aeSStefano Zampini A->ops->matsolve = MatMatSolve_SeqDense; 692db4efbfdSBarry Smith A->ops->solvetranspose = MatSolveTranspose_SeqDense; 693d5f3da31SBarry Smith A->factortype = MAT_FACTOR_CHOLESKY; 6942205254eSKarl Rupp 695f6224b95SHong Zhang ierr = PetscFree(A->solvertype);CHKERRQ(ierr); 696f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&A->solvertype);CHKERRQ(ierr); 697f6224b95SHong Zhang 698eb3f19e4SBarry Smith ierr = PetscLogFlops((1.0*A->cmap->n*A->cmap->n*A->cmap->n)/3.0);CHKERRQ(ierr); 699db4efbfdSBarry Smith PetscFunctionReturn(0); 700db4efbfdSBarry Smith } 701db4efbfdSBarry Smith 7020481f469SBarry Smith PetscErrorCode MatCholeskyFactorNumeric_SeqDense(Mat fact,Mat A,const MatFactorInfo *info_dummy) 703db4efbfdSBarry Smith { 704db4efbfdSBarry Smith PetscErrorCode ierr; 705db4efbfdSBarry Smith MatFactorInfo info; 706db4efbfdSBarry Smith 707db4efbfdSBarry Smith PetscFunctionBegin; 708db4efbfdSBarry Smith info.fill = 1.0; 7092205254eSKarl Rupp 710c3ef05f6SHong Zhang ierr = MatDuplicateNoCreate_SeqDense(fact,A,MAT_COPY_VALUES);CHKERRQ(ierr); 711ca15aa20SStefano Zampini ierr = (*fact->ops->choleskyfactor)(fact,0,&info);CHKERRQ(ierr); 712db4efbfdSBarry Smith PetscFunctionReturn(0); 713db4efbfdSBarry 
Smith } 714db4efbfdSBarry Smith 715ca15aa20SStefano Zampini PetscErrorCode MatCholeskyFactorSymbolic_SeqDense(Mat fact,Mat A,IS row,const MatFactorInfo *info) 716db4efbfdSBarry Smith { 717db4efbfdSBarry Smith PetscFunctionBegin; 718c3ef05f6SHong Zhang fact->assembled = PETSC_TRUE; 7191bbcc794SSatish Balay fact->preallocated = PETSC_TRUE; 720719d5645SBarry Smith fact->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqDense; 721bd443b22SStefano Zampini fact->ops->solve = MatSolve_SeqDense; 722bd443b22SStefano Zampini fact->ops->matsolve = MatMatSolve_SeqDense; 723bd443b22SStefano Zampini fact->ops->solvetranspose = MatSolveTranspose_SeqDense; 724db4efbfdSBarry Smith PetscFunctionReturn(0); 725db4efbfdSBarry Smith } 726db4efbfdSBarry Smith 727ca15aa20SStefano Zampini PetscErrorCode MatLUFactorSymbolic_SeqDense(Mat fact,Mat A,IS row,IS col,const MatFactorInfo *info) 728db4efbfdSBarry Smith { 729db4efbfdSBarry Smith PetscFunctionBegin; 730b66fe19dSMatthew G Knepley fact->preallocated = PETSC_TRUE; 731c3ef05f6SHong Zhang fact->assembled = PETSC_TRUE; 732719d5645SBarry Smith fact->ops->lufactornumeric = MatLUFactorNumeric_SeqDense; 733bd443b22SStefano Zampini fact->ops->solve = MatSolve_SeqDense; 734bd443b22SStefano Zampini fact->ops->matsolve = MatMatSolve_SeqDense; 735bd443b22SStefano Zampini fact->ops->solvetranspose = MatSolveTranspose_SeqDense; 736db4efbfdSBarry Smith PetscFunctionReturn(0); 737db4efbfdSBarry Smith } 738db4efbfdSBarry Smith 739ca15aa20SStefano Zampini /* uses LAPACK */ 740cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatGetFactor_seqdense_petsc(Mat A,MatFactorType ftype,Mat *fact) 741db4efbfdSBarry Smith { 742db4efbfdSBarry Smith PetscErrorCode ierr; 743db4efbfdSBarry Smith 744db4efbfdSBarry Smith PetscFunctionBegin; 745ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),fact);CHKERRQ(ierr); 746db4efbfdSBarry Smith ierr = MatSetSizes(*fact,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 747ca15aa20SStefano 
Zampini ierr = MatSetType(*fact,MATDENSE);CHKERRQ(ierr); 748db4efbfdSBarry Smith if (ftype == MAT_FACTOR_LU) { 749db4efbfdSBarry Smith (*fact)->ops->lufactorsymbolic = MatLUFactorSymbolic_SeqDense; 750db4efbfdSBarry Smith } else { 751db4efbfdSBarry Smith (*fact)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqDense; 752db4efbfdSBarry Smith } 753d5f3da31SBarry Smith (*fact)->factortype = ftype; 75400c67f3bSHong Zhang 75500c67f3bSHong Zhang ierr = PetscFree((*fact)->solvertype);CHKERRQ(ierr); 75600c67f3bSHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&(*fact)->solvertype);CHKERRQ(ierr); 757db4efbfdSBarry Smith PetscFunctionReturn(0); 758db4efbfdSBarry Smith } 759db4efbfdSBarry Smith 760289bc588SBarry Smith /* ------------------------------------------------------------------*/ 761e0877f53SBarry Smith static PetscErrorCode MatSOR_SeqDense(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal shift,PetscInt its,PetscInt lits,Vec xx) 762289bc588SBarry Smith { 763c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 764d9ca1df4SBarry Smith PetscScalar *x,*v = mat->v,zero = 0.0,xt; 765d9ca1df4SBarry Smith const PetscScalar *b; 766dfbe8321SBarry Smith PetscErrorCode ierr; 767d0f46423SBarry Smith PetscInt m = A->rmap->n,i; 768c5df96a5SBarry Smith PetscBLASInt o = 1,bm; 769289bc588SBarry Smith 7703a40ed3dSBarry Smith PetscFunctionBegin; 771ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 772c70f7ee4SJunchao Zhang if (A->offloadmask == PETSC_OFFLOAD_GPU) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Not implemented"); 773ca15aa20SStefano Zampini #endif 774422a814eSBarry Smith if (shift == -1) shift = 0.0; /* negative shift indicates do not error on zero diagonal; this code never zeros on zero diagonal */ 775c5df96a5SBarry Smith ierr = PetscBLASIntCast(m,&bm);CHKERRQ(ierr); 776289bc588SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 7773bffc371SBarry Smith /* this is a hack fix, should have another version without the second BLASdotu */ 
7782dcb1b2aSMatthew Knepley ierr = VecSet(xx,zero);CHKERRQ(ierr); 779289bc588SBarry Smith } 7801ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 781d9ca1df4SBarry Smith ierr = VecGetArrayRead(bb,&b);CHKERRQ(ierr); 782b965ef7fSBarry Smith its = its*lits; 783e32f2f54SBarry Smith if (its <= 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Relaxation requires global its %D and local its %D both positive",its,lits); 784289bc588SBarry Smith while (its--) { 785fccaa45eSBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 786289bc588SBarry Smith for (i=0; i<m; i++) { 7873bffc371SBarry Smith PetscStackCallBLAS("BLASdotu",xt = b[i] - BLASdotu_(&bm,v+i,&bm,x,&o)); 78855a1b374SBarry Smith x[i] = (1. - omega)*x[i] + omega*(xt+v[i + i*m]*x[i])/(v[i + i*m]+shift); 789289bc588SBarry Smith } 790289bc588SBarry Smith } 791fccaa45eSBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 792289bc588SBarry Smith for (i=m-1; i>=0; i--) { 7933bffc371SBarry Smith PetscStackCallBLAS("BLASdotu",xt = b[i] - BLASdotu_(&bm,v+i,&bm,x,&o)); 79455a1b374SBarry Smith x[i] = (1. 
- omega)*x[i] + omega*(xt+v[i + i*m]*x[i])/(v[i + i*m]+shift); 795289bc588SBarry Smith } 796289bc588SBarry Smith } 797289bc588SBarry Smith } 798d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 7991ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 8003a40ed3dSBarry Smith PetscFunctionReturn(0); 801289bc588SBarry Smith } 802289bc588SBarry Smith 803289bc588SBarry Smith /* -----------------------------------------------------------------*/ 804ca15aa20SStefano Zampini PetscErrorCode MatMultTranspose_SeqDense(Mat A,Vec xx,Vec yy) 805289bc588SBarry Smith { 806c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 807d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 808d9ca1df4SBarry Smith PetscScalar *y; 809dfbe8321SBarry Smith PetscErrorCode ierr; 8100805154bSBarry Smith PetscBLASInt m, n,_One=1; 811ea709b57SSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 8123a40ed3dSBarry Smith 8133a40ed3dSBarry Smith PetscFunctionBegin; 814c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 815c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 816d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8172bf066beSStefano Zampini ierr = VecGetArrayWrite(yy,&y);CHKERRQ(ierr); 8185ac36cfcSBarry Smith if (!A->rmap->n || !A->cmap->n) { 8195ac36cfcSBarry Smith PetscBLASInt i; 8205ac36cfcSBarry Smith for (i=0; i<n; i++) y[i] = 0.0; 8215ac36cfcSBarry Smith } else { 8228b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("T",&m,&n,&_DOne,v,&mat->lda,x,&_One,&_DZero,y,&_One)); 8235ac36cfcSBarry Smith ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n - A->cmap->n);CHKERRQ(ierr); 8245ac36cfcSBarry Smith } 825d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8262bf066beSStefano Zampini ierr = VecRestoreArrayWrite(yy,&y);CHKERRQ(ierr); 8273a40ed3dSBarry Smith PetscFunctionReturn(0); 828289bc588SBarry Smith } 829800995b7SMatthew Knepley 830ca15aa20SStefano Zampini 
PetscErrorCode MatMult_SeqDense(Mat A,Vec xx,Vec yy) 831289bc588SBarry Smith { 832c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 833d9ca1df4SBarry Smith PetscScalar *y,_DOne=1.0,_DZero=0.0; 834dfbe8321SBarry Smith PetscErrorCode ierr; 8350805154bSBarry Smith PetscBLASInt m, n, _One=1; 836d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 8373a40ed3dSBarry Smith 8383a40ed3dSBarry Smith PetscFunctionBegin; 839c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 840c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 841d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8422bf066beSStefano Zampini ierr = VecGetArrayWrite(yy,&y);CHKERRQ(ierr); 8435ac36cfcSBarry Smith if (!A->rmap->n || !A->cmap->n) { 8445ac36cfcSBarry Smith PetscBLASInt i; 8455ac36cfcSBarry Smith for (i=0; i<m; i++) y[i] = 0.0; 8465ac36cfcSBarry Smith } else { 8478b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("N",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DZero,y,&_One)); 8485ac36cfcSBarry Smith ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n - A->rmap->n);CHKERRQ(ierr); 8495ac36cfcSBarry Smith } 850d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8512bf066beSStefano Zampini ierr = VecRestoreArrayWrite(yy,&y);CHKERRQ(ierr); 8523a40ed3dSBarry Smith PetscFunctionReturn(0); 853289bc588SBarry Smith } 8546ee01492SSatish Balay 855ca15aa20SStefano Zampini PetscErrorCode MatMultAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 856289bc588SBarry Smith { 857c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 858d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 859d9ca1df4SBarry Smith PetscScalar *y,_DOne=1.0; 860dfbe8321SBarry Smith PetscErrorCode ierr; 8610805154bSBarry Smith PetscBLASInt m, n, _One=1; 8623a40ed3dSBarry Smith 8633a40ed3dSBarry Smith PetscFunctionBegin; 864c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 865c5df96a5SBarry Smith ierr = 
PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 866d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 867600d6d0bSBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 868d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8691ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 8708b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("N",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DOne,y,&_One)); 871d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8721ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 873dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n);CHKERRQ(ierr); 8743a40ed3dSBarry Smith PetscFunctionReturn(0); 875289bc588SBarry Smith } 8766ee01492SSatish Balay 877ca15aa20SStefano Zampini PetscErrorCode MatMultTransposeAdd_SeqDense(Mat A,Vec xx,Vec zz,Vec yy) 878289bc588SBarry Smith { 879c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 880d9ca1df4SBarry Smith const PetscScalar *v = mat->v,*x; 881d9ca1df4SBarry Smith PetscScalar *y; 882dfbe8321SBarry Smith PetscErrorCode ierr; 8830805154bSBarry Smith PetscBLASInt m, n, _One=1; 88487828ca2SBarry Smith PetscScalar _DOne=1.0; 8853a40ed3dSBarry Smith 8863a40ed3dSBarry Smith PetscFunctionBegin; 887c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&m);CHKERRQ(ierr); 888c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->cmap->n,&n);CHKERRQ(ierr); 889d0f46423SBarry Smith if (!A->rmap->n || !A->cmap->n) PetscFunctionReturn(0); 890600d6d0bSBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 891d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 8921ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 8938b83055fSJed Brown PetscStackCallBLAS("BLASgemv",BLASgemv_("T",&m,&n,&_DOne,v,&(mat->lda),x,&_One,&_DOne,y,&_One)); 894d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 8951ebc52fbSHong Zhang ierr = 
VecRestoreArray(yy,&y);CHKERRQ(ierr); 896dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->rmap->n*A->cmap->n);CHKERRQ(ierr); 8973a40ed3dSBarry Smith PetscFunctionReturn(0); 898289bc588SBarry Smith } 899289bc588SBarry Smith 900289bc588SBarry Smith /* -----------------------------------------------------------------*/ 901e0877f53SBarry Smith static PetscErrorCode MatGetRow_SeqDense(Mat A,PetscInt row,PetscInt *ncols,PetscInt **cols,PetscScalar **vals) 902289bc588SBarry Smith { 903c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 9046849ba73SBarry Smith PetscErrorCode ierr; 90513f74950SBarry Smith PetscInt i; 90667e560aaSBarry Smith 9073a40ed3dSBarry Smith PetscFunctionBegin; 908d0f46423SBarry Smith *ncols = A->cmap->n; 909289bc588SBarry Smith if (cols) { 910854ce69bSBarry Smith ierr = PetscMalloc1(A->cmap->n+1,cols);CHKERRQ(ierr); 911d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) (*cols)[i] = i; 912289bc588SBarry Smith } 913289bc588SBarry Smith if (vals) { 914ca15aa20SStefano Zampini const PetscScalar *v; 915ca15aa20SStefano Zampini 916ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 917854ce69bSBarry Smith ierr = PetscMalloc1(A->cmap->n+1,vals);CHKERRQ(ierr); 918ca15aa20SStefano Zampini v += row; 919d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) {(*vals)[i] = *v; v += mat->lda;} 920ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 921289bc588SBarry Smith } 9223a40ed3dSBarry Smith PetscFunctionReturn(0); 923289bc588SBarry Smith } 9246ee01492SSatish Balay 925e0877f53SBarry Smith static PetscErrorCode MatRestoreRow_SeqDense(Mat A,PetscInt row,PetscInt *ncols,PetscInt **cols,PetscScalar **vals) 926289bc588SBarry Smith { 927dfbe8321SBarry Smith PetscErrorCode ierr; 9286e111a19SKarl Rupp 929606d414cSSatish Balay PetscFunctionBegin; 930606d414cSSatish Balay if (cols) {ierr = PetscFree(*cols);CHKERRQ(ierr);} 931606d414cSSatish Balay if (vals) {ierr = PetscFree(*vals);CHKERRQ(ierr); } 
9323a40ed3dSBarry Smith PetscFunctionReturn(0); 933289bc588SBarry Smith } 934289bc588SBarry Smith /* ----------------------------------------------------------------*/ 935e0877f53SBarry Smith static PetscErrorCode MatSetValues_SeqDense(Mat A,PetscInt m,const PetscInt indexm[],PetscInt n,const PetscInt indexn[],const PetscScalar v[],InsertMode addv) 936289bc588SBarry Smith { 937c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 938ca15aa20SStefano Zampini PetscScalar *av; 93913f74950SBarry Smith PetscInt i,j,idx=0; 940ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 941c70f7ee4SJunchao Zhang PetscOffloadMask oldf; 942ca15aa20SStefano Zampini #endif 943ca15aa20SStefano Zampini PetscErrorCode ierr; 944d6dfbf8fSBarry Smith 9453a40ed3dSBarry Smith PetscFunctionBegin; 946ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&av);CHKERRQ(ierr); 947289bc588SBarry Smith if (!mat->roworiented) { 948dbb450caSBarry Smith if (addv == INSERT_VALUES) { 949289bc588SBarry Smith for (j=0; j<n; j++) { 950cddbea37SSatish Balay if (indexn[j] < 0) {idx += m; continue;} 951cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexn[j] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 952289bc588SBarry Smith for (i=0; i<m; i++) { 953cddbea37SSatish Balay if (indexm[i] < 0) {idx++; continue;} 954cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexm[i] >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 955ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] = v[idx++]; 956289bc588SBarry Smith } 957289bc588SBarry Smith } 9583a40ed3dSBarry Smith } else { 959289bc588SBarry Smith for (j=0; j<n; j++) { 960cddbea37SSatish Balay if (indexn[j] < 0) {idx += m; continue;} 961cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexn[j] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max 
%D",indexn[j],A->cmap->n-1); 962289bc588SBarry Smith for (i=0; i<m; i++) { 963cddbea37SSatish Balay if (indexm[i] < 0) {idx++; continue;} 964cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexm[i] >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 965ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] += v[idx++]; 966289bc588SBarry Smith } 967289bc588SBarry Smith } 968289bc588SBarry Smith } 9693a40ed3dSBarry Smith } else { 970dbb450caSBarry Smith if (addv == INSERT_VALUES) { 971e8d4e0b9SBarry Smith for (i=0; i<m; i++) { 972cddbea37SSatish Balay if (indexm[i] < 0) { idx += n; continue;} 973cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexm[i] >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 974e8d4e0b9SBarry Smith for (j=0; j<n; j++) { 975cddbea37SSatish Balay if (indexn[j] < 0) { idx++; continue;} 976cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexn[j] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 977ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] = v[idx++]; 978e8d4e0b9SBarry Smith } 979e8d4e0b9SBarry Smith } 9803a40ed3dSBarry Smith } else { 981289bc588SBarry Smith for (i=0; i<m; i++) { 982cddbea37SSatish Balay if (indexm[i] < 0) { idx += n; continue;} 983cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexm[i] >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",indexm[i],A->rmap->n-1); 984289bc588SBarry Smith for (j=0; j<n; j++) { 985cddbea37SSatish Balay if (indexn[j] < 0) { idx++; continue;} 986cf9c20a2SJed Brown if (PetscUnlikelyDebug(indexn[j] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",indexn[j],A->cmap->n-1); 987ca15aa20SStefano Zampini av[indexn[j]*mat->lda + indexm[i]] += v[idx++]; 988289bc588SBarry Smith } 989289bc588SBarry 
Smith } 990289bc588SBarry Smith } 991e8d4e0b9SBarry Smith } 992ca15aa20SStefano Zampini /* hack to prevent unneeded copy to the GPU while returning the array */ 993ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 994c70f7ee4SJunchao Zhang oldf = A->offloadmask; 995c70f7ee4SJunchao Zhang A->offloadmask = PETSC_OFFLOAD_GPU; 996ca15aa20SStefano Zampini #endif 997ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&av);CHKERRQ(ierr); 998ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 999c70f7ee4SJunchao Zhang A->offloadmask = (oldf == PETSC_OFFLOAD_UNALLOCATED ? PETSC_OFFLOAD_UNALLOCATED : PETSC_OFFLOAD_CPU); 1000ca15aa20SStefano Zampini #endif 10013a40ed3dSBarry Smith PetscFunctionReturn(0); 1002289bc588SBarry Smith } 1003e8d4e0b9SBarry Smith 1004e0877f53SBarry Smith static PetscErrorCode MatGetValues_SeqDense(Mat A,PetscInt m,const PetscInt indexm[],PetscInt n,const PetscInt indexn[],PetscScalar v[]) 1005ae80bb75SLois Curfman McInnes { 1006ae80bb75SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1007ca15aa20SStefano Zampini const PetscScalar *vv; 100813f74950SBarry Smith PetscInt i,j; 1009ca15aa20SStefano Zampini PetscErrorCode ierr; 1010ae80bb75SLois Curfman McInnes 10113a40ed3dSBarry Smith PetscFunctionBegin; 1012ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&vv);CHKERRQ(ierr); 1013ae80bb75SLois Curfman McInnes /* row-oriented output */ 1014ae80bb75SLois Curfman McInnes for (i=0; i<m; i++) { 101597e567efSBarry Smith if (indexm[i] < 0) {v += n;continue;} 1016e32f2f54SBarry Smith if (indexm[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested larger than number rows %D",indexm[i],A->rmap->n); 1017ae80bb75SLois Curfman McInnes for (j=0; j<n; j++) { 10186f31f424SBarry Smith if (indexn[j] < 0) {v++; continue;} 1019e32f2f54SBarry Smith if (indexn[j] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column %D requested larger than number columns %D",indexn[j],A->cmap->n); 
1020ca15aa20SStefano Zampini *v++ = vv[indexn[j]*mat->lda + indexm[i]]; 1021ae80bb75SLois Curfman McInnes } 1022ae80bb75SLois Curfman McInnes } 1023ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&vv);CHKERRQ(ierr); 10243a40ed3dSBarry Smith PetscFunctionReturn(0); 1025ae80bb75SLois Curfman McInnes } 1026ae80bb75SLois Curfman McInnes 1027289bc588SBarry Smith /* -----------------------------------------------------------------*/ 1028289bc588SBarry Smith 10298491ab44SLisandro Dalcin PetscErrorCode MatView_Dense_Binary(Mat mat,PetscViewer viewer) 1030aabbc4fbSShri Abhyankar { 1031aabbc4fbSShri Abhyankar PetscErrorCode ierr; 10328491ab44SLisandro Dalcin PetscBool skipHeader; 10338491ab44SLisandro Dalcin PetscViewerFormat format; 10348491ab44SLisandro Dalcin PetscInt header[4],M,N,m,lda,i,j,k; 10358491ab44SLisandro Dalcin const PetscScalar *v; 10368491ab44SLisandro Dalcin PetscScalar *vwork; 1037aabbc4fbSShri Abhyankar 1038aabbc4fbSShri Abhyankar PetscFunctionBegin; 10398491ab44SLisandro Dalcin ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 10408491ab44SLisandro Dalcin ierr = PetscViewerBinaryGetSkipHeader(viewer,&skipHeader);CHKERRQ(ierr); 10418491ab44SLisandro Dalcin ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 10428491ab44SLisandro Dalcin if (skipHeader) format = PETSC_VIEWER_NATIVE; 1043aabbc4fbSShri Abhyankar 10448491ab44SLisandro Dalcin ierr = MatGetSize(mat,&M,&N);CHKERRQ(ierr); 10458491ab44SLisandro Dalcin 10468491ab44SLisandro Dalcin /* write matrix header */ 10478491ab44SLisandro Dalcin header[0] = MAT_FILE_CLASSID; header[1] = M; header[2] = N; 10488491ab44SLisandro Dalcin header[3] = (format == PETSC_VIEWER_NATIVE) ? 
MATRIX_BINARY_FORMAT_DENSE : M*N; 10498491ab44SLisandro Dalcin if (!skipHeader) {ierr = PetscViewerBinaryWrite(viewer,header,4,PETSC_INT);CHKERRQ(ierr);} 10508491ab44SLisandro Dalcin 10518491ab44SLisandro Dalcin ierr = MatGetLocalSize(mat,&m,NULL);CHKERRQ(ierr); 10528491ab44SLisandro Dalcin if (format != PETSC_VIEWER_NATIVE) { 10538491ab44SLisandro Dalcin PetscInt nnz = m*N, *iwork; 10548491ab44SLisandro Dalcin /* store row lengths for each row */ 10558491ab44SLisandro Dalcin ierr = PetscMalloc1(nnz,&iwork);CHKERRQ(ierr); 10568491ab44SLisandro Dalcin for (i=0; i<m; i++) iwork[i] = N; 10578491ab44SLisandro Dalcin ierr = PetscViewerBinaryWriteAll(viewer,iwork,m,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_INT);CHKERRQ(ierr); 10588491ab44SLisandro Dalcin /* store column indices (zero start index) */ 10598491ab44SLisandro Dalcin for (k=0, i=0; i<m; i++) 10608491ab44SLisandro Dalcin for (j=0; j<N; j++, k++) 10618491ab44SLisandro Dalcin iwork[k] = j; 10628491ab44SLisandro Dalcin ierr = PetscViewerBinaryWriteAll(viewer,iwork,nnz,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_INT);CHKERRQ(ierr); 10638491ab44SLisandro Dalcin ierr = PetscFree(iwork);CHKERRQ(ierr); 10648491ab44SLisandro Dalcin } 10658491ab44SLisandro Dalcin /* store matrix values as a dense matrix in row major order */ 10668491ab44SLisandro Dalcin ierr = PetscMalloc1(m*N,&vwork);CHKERRQ(ierr); 10678491ab44SLisandro Dalcin ierr = MatDenseGetArrayRead(mat,&v);CHKERRQ(ierr); 10688491ab44SLisandro Dalcin ierr = MatDenseGetLDA(mat,&lda);CHKERRQ(ierr); 10698491ab44SLisandro Dalcin for (k=0, i=0; i<m; i++) 10708491ab44SLisandro Dalcin for (j=0; j<N; j++, k++) 10718491ab44SLisandro Dalcin vwork[k] = v[i+lda*j]; 10728491ab44SLisandro Dalcin ierr = MatDenseRestoreArrayRead(mat,&v);CHKERRQ(ierr); 10738491ab44SLisandro Dalcin ierr = PetscViewerBinaryWriteAll(viewer,vwork,m*N,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_SCALAR);CHKERRQ(ierr); 10748491ab44SLisandro Dalcin ierr = PetscFree(vwork);CHKERRQ(ierr); 10758491ab44SLisandro Dalcin 
PetscFunctionReturn(0); 10768491ab44SLisandro Dalcin } 10778491ab44SLisandro Dalcin 10788491ab44SLisandro Dalcin PetscErrorCode MatLoad_Dense_Binary(Mat mat,PetscViewer viewer) 10798491ab44SLisandro Dalcin { 10808491ab44SLisandro Dalcin PetscErrorCode ierr; 10818491ab44SLisandro Dalcin PetscBool skipHeader; 10828491ab44SLisandro Dalcin PetscInt header[4],M,N,m,nz,lda,i,j,k; 10838491ab44SLisandro Dalcin PetscInt rows,cols; 10848491ab44SLisandro Dalcin PetscScalar *v,*vwork; 10858491ab44SLisandro Dalcin 10868491ab44SLisandro Dalcin PetscFunctionBegin; 10878491ab44SLisandro Dalcin ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 10888491ab44SLisandro Dalcin ierr = PetscViewerBinaryGetSkipHeader(viewer,&skipHeader);CHKERRQ(ierr); 10898491ab44SLisandro Dalcin 10908491ab44SLisandro Dalcin if (!skipHeader) { 10918491ab44SLisandro Dalcin ierr = PetscViewerBinaryRead(viewer,header,4,NULL,PETSC_INT);CHKERRQ(ierr); 10928491ab44SLisandro Dalcin if (header[0] != MAT_FILE_CLASSID) SETERRQ(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Not a matrix object in file"); 10938491ab44SLisandro Dalcin M = header[1]; N = header[2]; 10948491ab44SLisandro Dalcin if (M < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix row size (%D) in file is negative",M); 10958491ab44SLisandro Dalcin if (N < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix column size (%D) in file is negative",N); 10968491ab44SLisandro Dalcin nz = header[3]; 10978491ab44SLisandro Dalcin if (nz != MATRIX_BINARY_FORMAT_DENSE && nz < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Unknown matrix format %D in file",nz); 1098aabbc4fbSShri Abhyankar } else { 10998491ab44SLisandro Dalcin ierr = MatGetSize(mat,&M,&N);CHKERRQ(ierr); 11008491ab44SLisandro Dalcin if (M < 0 || N < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Matrix binary file header was skipped, thus the user must specify the global sizes of input matrix"); 
11018491ab44SLisandro Dalcin nz = MATRIX_BINARY_FORMAT_DENSE; 1102e6324fbbSBarry Smith } 1103aabbc4fbSShri Abhyankar 11048491ab44SLisandro Dalcin /* setup global sizes if not set */ 11058491ab44SLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 11068491ab44SLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 11078491ab44SLisandro Dalcin ierr = MatSetUp(mat);CHKERRQ(ierr); 11088491ab44SLisandro Dalcin /* check if global sizes are correct */ 11098491ab44SLisandro Dalcin ierr = MatGetSize(mat,&rows,&cols);CHKERRQ(ierr); 11108491ab44SLisandro Dalcin if (M != rows || N != cols) SETERRQ4(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%d, %d) than the input matrix (%d, %d)",M,N,rows,cols); 1111aabbc4fbSShri Abhyankar 11128491ab44SLisandro Dalcin ierr = MatGetSize(mat,NULL,&N);CHKERRQ(ierr); 11138491ab44SLisandro Dalcin ierr = MatGetLocalSize(mat,&m,NULL);CHKERRQ(ierr); 11148491ab44SLisandro Dalcin ierr = MatDenseGetArray(mat,&v);CHKERRQ(ierr); 11158491ab44SLisandro Dalcin ierr = MatDenseGetLDA(mat,&lda);CHKERRQ(ierr); 11168491ab44SLisandro Dalcin if (nz == MATRIX_BINARY_FORMAT_DENSE) { /* matrix in file is dense format */ 11178491ab44SLisandro Dalcin PetscInt nnz = m*N; 11188491ab44SLisandro Dalcin /* read in matrix values */ 11198491ab44SLisandro Dalcin ierr = PetscMalloc1(nnz,&vwork);CHKERRQ(ierr); 11208491ab44SLisandro Dalcin ierr = PetscViewerBinaryReadAll(viewer,vwork,nnz,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_SCALAR);CHKERRQ(ierr); 11218491ab44SLisandro Dalcin /* store values in column major order */ 11228491ab44SLisandro Dalcin for (j=0; j<N; j++) 11238491ab44SLisandro Dalcin for (i=0; i<m; i++) 11248491ab44SLisandro Dalcin v[i+lda*j] = vwork[i*N+j]; 11258491ab44SLisandro Dalcin ierr = PetscFree(vwork);CHKERRQ(ierr); 11268491ab44SLisandro Dalcin } else { /* matrix in file is sparse format */ 11278491ab44SLisandro Dalcin PetscInt nnz = 0, *rlens, *icols; 11288491ab44SLisandro Dalcin /* read in row lengths 
*/ 11298491ab44SLisandro Dalcin ierr = PetscMalloc1(m,&rlens);CHKERRQ(ierr); 11308491ab44SLisandro Dalcin ierr = PetscViewerBinaryReadAll(viewer,rlens,m,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_INT);CHKERRQ(ierr); 11318491ab44SLisandro Dalcin for (i=0; i<m; i++) nnz += rlens[i]; 11328491ab44SLisandro Dalcin /* read in column indices and values */ 11338491ab44SLisandro Dalcin ierr = PetscMalloc2(nnz,&icols,nnz,&vwork);CHKERRQ(ierr); 11348491ab44SLisandro Dalcin ierr = PetscViewerBinaryReadAll(viewer,icols,nnz,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_INT);CHKERRQ(ierr); 11358491ab44SLisandro Dalcin ierr = PetscViewerBinaryReadAll(viewer,vwork,nnz,PETSC_DETERMINE,PETSC_DETERMINE,PETSC_SCALAR);CHKERRQ(ierr); 11368491ab44SLisandro Dalcin /* store values in column major order */ 11378491ab44SLisandro Dalcin for (k=0, i=0; i<m; i++) 11388491ab44SLisandro Dalcin for (j=0; j<rlens[i]; j++, k++) 11398491ab44SLisandro Dalcin v[i+lda*icols[k]] = vwork[k]; 11408491ab44SLisandro Dalcin ierr = PetscFree(rlens);CHKERRQ(ierr); 11418491ab44SLisandro Dalcin ierr = PetscFree2(icols,vwork);CHKERRQ(ierr); 1142aabbc4fbSShri Abhyankar } 11438491ab44SLisandro Dalcin ierr = MatDenseRestoreArray(mat,&v);CHKERRQ(ierr); 11448491ab44SLisandro Dalcin ierr = MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 11458491ab44SLisandro Dalcin ierr = MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1146aabbc4fbSShri Abhyankar PetscFunctionReturn(0); 1147aabbc4fbSShri Abhyankar } 1148aabbc4fbSShri Abhyankar 1149eb91f321SVaclav Hapla PetscErrorCode MatLoad_SeqDense(Mat newMat, PetscViewer viewer) 1150eb91f321SVaclav Hapla { 1151eb91f321SVaclav Hapla PetscBool isbinary, ishdf5; 1152eb91f321SVaclav Hapla PetscErrorCode ierr; 1153eb91f321SVaclav Hapla 1154eb91f321SVaclav Hapla PetscFunctionBegin; 1155eb91f321SVaclav Hapla PetscValidHeaderSpecific(newMat,MAT_CLASSID,1); 1156eb91f321SVaclav Hapla PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2); 1157eb91f321SVaclav Hapla /* force binary viewer to 
load .info file if it has not yet done so */ 1158eb91f321SVaclav Hapla ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 1159eb91f321SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 1160eb91f321SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5, &ishdf5);CHKERRQ(ierr); 1161eb91f321SVaclav Hapla if (isbinary) { 11628491ab44SLisandro Dalcin ierr = MatLoad_Dense_Binary(newMat,viewer);CHKERRQ(ierr); 1163eb91f321SVaclav Hapla } else if (ishdf5) { 1164eb91f321SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 1165eb91f321SVaclav Hapla ierr = MatLoad_Dense_HDF5(newMat,viewer);CHKERRQ(ierr); 1166eb91f321SVaclav Hapla #else 1167eb91f321SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 1168eb91f321SVaclav Hapla #endif 1169eb91f321SVaclav Hapla } else { 1170eb91f321SVaclav Hapla SETERRQ2(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name); 1171eb91f321SVaclav Hapla } 1172eb91f321SVaclav Hapla PetscFunctionReturn(0); 1173eb91f321SVaclav Hapla } 1174eb91f321SVaclav Hapla 11756849ba73SBarry Smith static PetscErrorCode MatView_SeqDense_ASCII(Mat A,PetscViewer viewer) 1176289bc588SBarry Smith { 1177932b0c3eSLois Curfman McInnes Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1178dfbe8321SBarry Smith PetscErrorCode ierr; 117913f74950SBarry Smith PetscInt i,j; 11802dcb1b2aSMatthew Knepley const char *name; 1181ca15aa20SStefano Zampini PetscScalar *v,*av; 1182f3ef73ceSBarry Smith PetscViewerFormat format; 11835f481a85SSatish Balay #if defined(PETSC_USE_COMPLEX) 1184ace3abfcSBarry Smith PetscBool allreal = PETSC_TRUE; 11855f481a85SSatish Balay #endif 1186932b0c3eSLois Curfman McInnes 11873a40ed3dSBarry Smith PetscFunctionBegin; 1188ca15aa20SStefano Zampini ierr = 
MatDenseGetArrayRead(A,(const PetscScalar**)&av);CHKERRQ(ierr); 1189b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 1190456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 11913a40ed3dSBarry Smith PetscFunctionReturn(0); /* do nothing for now */ 1192fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 1193d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 1194d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1195ca15aa20SStefano Zampini v = av + i; 119677431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 1197d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1198aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 1199329f5518SBarry Smith if (PetscRealPart(*v) != 0.0 && PetscImaginaryPart(*v) != 0.0) { 120057622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i) ",j,(double)PetscRealPart(*v),(double)PetscImaginaryPart(*v));CHKERRQ(ierr); 1201329f5518SBarry Smith } else if (PetscRealPart(*v)) { 120257622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",j,(double)PetscRealPart(*v));CHKERRQ(ierr); 12036831982aSBarry Smith } 120480cd9d93SLois Curfman McInnes #else 12056831982aSBarry Smith if (*v) { 120657622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",j,(double)*v);CHKERRQ(ierr); 12076831982aSBarry Smith } 120880cd9d93SLois Curfman McInnes #endif 12091b807ce4Svictorle v += a->lda; 121080cd9d93SLois Curfman McInnes } 1211b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 121280cd9d93SLois Curfman McInnes } 1213d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 12143a40ed3dSBarry Smith } else { 1215d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 1216aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 121747989497SBarry Smith /* determine if 
matrix has all real values */ 1218ca15aa20SStefano Zampini v = av; 1219d0f46423SBarry Smith for (i=0; i<A->rmap->n*A->cmap->n; i++) { 1220ffac6cdbSBarry Smith if (PetscImaginaryPart(v[i])) { allreal = PETSC_FALSE; break;} 122147989497SBarry Smith } 122247989497SBarry Smith #endif 1223fb9695e5SSatish Balay if (format == PETSC_VIEWER_ASCII_MATLAB) { 12243a7fca6bSBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 1225d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",A->rmap->n,A->cmap->n);CHKERRQ(ierr); 1226d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%s = zeros(%D,%D);\n",name,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 1227fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"%s = [\n",name);CHKERRQ(ierr); 1228ffac6cdbSBarry Smith } 1229ffac6cdbSBarry Smith 1230d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1231ca15aa20SStefano Zampini v = av + i; 1232d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1233aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 123447989497SBarry Smith if (allreal) { 1235c61cd2faSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%18.16e ",(double)PetscRealPart(*v));CHKERRQ(ierr); 123647989497SBarry Smith } else { 1237c61cd2faSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%18.16e + %18.16ei ",(double)PetscRealPart(*v),(double)PetscImaginaryPart(*v));CHKERRQ(ierr); 123847989497SBarry Smith } 1239289bc588SBarry Smith #else 1240c61cd2faSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%18.16e ",(double)*v);CHKERRQ(ierr); 1241289bc588SBarry Smith #endif 12421b807ce4Svictorle v += a->lda; 1243289bc588SBarry Smith } 1244b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 1245289bc588SBarry Smith } 1246fb9695e5SSatish Balay if (format == PETSC_VIEWER_ASCII_MATLAB) { 1247b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"];\n");CHKERRQ(ierr); 1248ffac6cdbSBarry Smith } 1249d00279f6SBarry Smith ierr = 
PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 1250da3a660dSBarry Smith } 1251ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&av);CHKERRQ(ierr); 1252b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 12533a40ed3dSBarry Smith PetscFunctionReturn(0); 1254289bc588SBarry Smith } 1255289bc588SBarry Smith 12569804daf3SBarry Smith #include <petscdraw.h> 1257e0877f53SBarry Smith static PetscErrorCode MatView_SeqDense_Draw_Zoom(PetscDraw draw,void *Aa) 1258f1af5d2fSBarry Smith { 1259f1af5d2fSBarry Smith Mat A = (Mat) Aa; 12606849ba73SBarry Smith PetscErrorCode ierr; 1261383922c3SLisandro Dalcin PetscInt m = A->rmap->n,n = A->cmap->n,i,j; 1262383922c3SLisandro Dalcin int color = PETSC_DRAW_WHITE; 1263ca15aa20SStefano Zampini const PetscScalar *v; 1264b0a32e0cSBarry Smith PetscViewer viewer; 1265b05fc000SLisandro Dalcin PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 1266f3ef73ceSBarry Smith PetscViewerFormat format; 1267f1af5d2fSBarry Smith 1268f1af5d2fSBarry Smith PetscFunctionBegin; 1269f1af5d2fSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 1270b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 1271b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 1272f1af5d2fSBarry Smith 1273f1af5d2fSBarry Smith /* Loop over matrix elements drawing boxes */ 1274ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&v);CHKERRQ(ierr); 1275fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 1276383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 1277f1af5d2fSBarry Smith /* Blue for negative and Red for positive */ 1278f1af5d2fSBarry Smith for (j = 0; j < n; j++) { 1279383922c3SLisandro Dalcin x_l = j; x_r = x_l + 1.0; 1280f1af5d2fSBarry Smith for (i = 0; i < m; i++) { 1281f1af5d2fSBarry Smith y_l = m - i - 1.0; 1282f1af5d2fSBarry Smith y_r = y_l + 1.0; 1283ca15aa20SStefano 
Zampini if (PetscRealPart(v[j*m+i]) > 0.) color = PETSC_DRAW_RED; 1284ca15aa20SStefano Zampini else if (PetscRealPart(v[j*m+i]) < 0.) color = PETSC_DRAW_BLUE; 1285ca15aa20SStefano Zampini else continue; 1286b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 1287f1af5d2fSBarry Smith } 1288f1af5d2fSBarry Smith } 1289383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 1290f1af5d2fSBarry Smith } else { 1291f1af5d2fSBarry Smith /* use contour shading to indicate magnitude of values */ 1292f1af5d2fSBarry Smith /* first determine max of all nonzero values */ 1293b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1294b05fc000SLisandro Dalcin PetscDraw popup; 1295b05fc000SLisandro Dalcin 1296f1af5d2fSBarry Smith for (i=0; i < m*n; i++) { 1297f1af5d2fSBarry Smith if (PetscAbsScalar(v[i]) > maxv) maxv = PetscAbsScalar(v[i]); 1298f1af5d2fSBarry Smith } 1299383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 1300b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 130145f3bb6eSLisandro Dalcin ierr = PetscDrawScalePopup(popup,minv,maxv);CHKERRQ(ierr); 1302383922c3SLisandro Dalcin 1303383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 1304f1af5d2fSBarry Smith for (j=0; j<n; j++) { 1305f1af5d2fSBarry Smith x_l = j; 1306f1af5d2fSBarry Smith x_r = x_l + 1.0; 1307f1af5d2fSBarry Smith for (i=0; i<m; i++) { 1308f1af5d2fSBarry Smith y_l = m - i - 1.0; 1309f1af5d2fSBarry Smith y_r = y_l + 1.0; 1310b05fc000SLisandro Dalcin color = PetscDrawRealToColor(PetscAbsScalar(v[j*m+i]),minv,maxv); 1311b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 1312f1af5d2fSBarry Smith } 1313f1af5d2fSBarry Smith } 1314383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 1315f1af5d2fSBarry Smith } 1316ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&v);CHKERRQ(ierr); 
1317f1af5d2fSBarry Smith PetscFunctionReturn(0); 1318f1af5d2fSBarry Smith } 1319f1af5d2fSBarry Smith 1320e0877f53SBarry Smith static PetscErrorCode MatView_SeqDense_Draw(Mat A,PetscViewer viewer) 1321f1af5d2fSBarry Smith { 1322b0a32e0cSBarry Smith PetscDraw draw; 1323ace3abfcSBarry Smith PetscBool isnull; 1324329f5518SBarry Smith PetscReal xr,yr,xl,yl,h,w; 1325dfbe8321SBarry Smith PetscErrorCode ierr; 1326f1af5d2fSBarry Smith 1327f1af5d2fSBarry Smith PetscFunctionBegin; 1328b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 1329b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 1330abc0a331SBarry Smith if (isnull) PetscFunctionReturn(0); 1331f1af5d2fSBarry Smith 1332d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1333f1af5d2fSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 1334b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 1335832b7cebSLisandro Dalcin ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 1336b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqDense_Draw_Zoom,A);CHKERRQ(ierr); 13370298fd71SBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL);CHKERRQ(ierr); 1338832b7cebSLisandro Dalcin ierr = PetscDrawSave(draw);CHKERRQ(ierr); 1339f1af5d2fSBarry Smith PetscFunctionReturn(0); 1340f1af5d2fSBarry Smith } 1341f1af5d2fSBarry Smith 1342dfbe8321SBarry Smith PetscErrorCode MatView_SeqDense(Mat A,PetscViewer viewer) 1343932b0c3eSLois Curfman McInnes { 1344dfbe8321SBarry Smith PetscErrorCode ierr; 1345ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1346932b0c3eSLois Curfman McInnes 13473a40ed3dSBarry Smith PetscFunctionBegin; 1348251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 1349251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 
1350251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 13510f5bd95cSBarry Smith 1352c45a1595SBarry Smith if (iascii) { 1353c45a1595SBarry Smith ierr = MatView_SeqDense_ASCII(A,viewer);CHKERRQ(ierr); 13540f5bd95cSBarry Smith } else if (isbinary) { 1355637a0070SStefano Zampini ierr = MatView_Dense_Binary(A,viewer);CHKERRQ(ierr); 1356f1af5d2fSBarry Smith } else if (isdraw) { 1357f1af5d2fSBarry Smith ierr = MatView_SeqDense_Draw(A,viewer);CHKERRQ(ierr); 1358932b0c3eSLois Curfman McInnes } 13593a40ed3dSBarry Smith PetscFunctionReturn(0); 1360932b0c3eSLois Curfman McInnes } 1361289bc588SBarry Smith 1362637a0070SStefano Zampini static PetscErrorCode MatDensePlaceArray_SeqDense(Mat A,const PetscScalar *array) 1363d3042a70SBarry Smith { 1364d3042a70SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1365d3042a70SBarry Smith 1366d3042a70SBarry Smith PetscFunctionBegin; 13676947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 1368d5ea218eSStefano Zampini if (a->unplacedarray) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreArray first"); 1369d3042a70SBarry Smith a->unplacedarray = a->v; 1370d3042a70SBarry Smith a->unplaced_user_alloc = a->user_alloc; 1371d3042a70SBarry Smith a->v = (PetscScalar*) array; 1372637a0070SStefano Zampini a->user_alloc = PETSC_TRUE; 1373ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1374c70f7ee4SJunchao Zhang A->offloadmask = PETSC_OFFLOAD_CPU; 1375ca15aa20SStefano Zampini #endif 1376d3042a70SBarry Smith PetscFunctionReturn(0); 1377d3042a70SBarry Smith } 1378d3042a70SBarry Smith 1379d3042a70SBarry Smith static PetscErrorCode MatDenseResetArray_SeqDense(Mat A) 1380d3042a70SBarry Smith { 1381d3042a70SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1382d3042a70SBarry Smith 1383d3042a70SBarry Smith PetscFunctionBegin; 13846947451fSStefano Zampini if (a->vecinuse) 
SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 1385d3042a70SBarry Smith a->v = a->unplacedarray; 1386d3042a70SBarry Smith a->user_alloc = a->unplaced_user_alloc; 1387d3042a70SBarry Smith a->unplacedarray = NULL; 1388ca15aa20SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1389c70f7ee4SJunchao Zhang A->offloadmask = PETSC_OFFLOAD_CPU; 1390ca15aa20SStefano Zampini #endif 1391d3042a70SBarry Smith PetscFunctionReturn(0); 1392d3042a70SBarry Smith } 1393d3042a70SBarry Smith 1394d5ea218eSStefano Zampini static PetscErrorCode MatDenseReplaceArray_SeqDense(Mat A,const PetscScalar *array) 1395d5ea218eSStefano Zampini { 1396d5ea218eSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 1397d5ea218eSStefano Zampini PetscErrorCode ierr; 1398d5ea218eSStefano Zampini 1399d5ea218eSStefano Zampini PetscFunctionBegin; 1400d5ea218eSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 1401d5ea218eSStefano Zampini if (!a->user_alloc) { ierr = PetscFree(a->v);CHKERRQ(ierr); } 1402d5ea218eSStefano Zampini a->v = (PetscScalar*) array; 1403d5ea218eSStefano Zampini a->user_alloc = PETSC_FALSE; 1404d5ea218eSStefano Zampini #if defined(PETSC_HAVE_CUDA) 1405d5ea218eSStefano Zampini A->offloadmask = PETSC_OFFLOAD_CPU; 1406d5ea218eSStefano Zampini #endif 1407d5ea218eSStefano Zampini PetscFunctionReturn(0); 1408d5ea218eSStefano Zampini } 1409d5ea218eSStefano Zampini 1410ca15aa20SStefano Zampini PetscErrorCode MatDestroy_SeqDense(Mat mat) 1411289bc588SBarry Smith { 1412ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)mat->data; 1413dfbe8321SBarry Smith PetscErrorCode ierr; 141490f02eecSBarry Smith 14153a40ed3dSBarry Smith PetscFunctionBegin; 1416aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1417d0f46423SBarry Smith PetscLogObjectState((PetscObject)mat,"Rows %D Cols %D",mat->rmap->n,mat->cmap->n); 1418a5a9c739SBarry Smith #endif 141905b42c5fSBarry Smith ierr = 
PetscFree(l->pivots);CHKERRQ(ierr); 1420a49dc2a2SStefano Zampini ierr = PetscFree(l->fwork);CHKERRQ(ierr); 1421abc3b08eSStefano Zampini ierr = MatDestroy(&l->ptapwork);CHKERRQ(ierr); 14226857c123SSatish Balay if (!l->user_alloc) {ierr = PetscFree(l->v);CHKERRQ(ierr);} 1423637a0070SStefano Zampini if (!l->unplaced_user_alloc) {ierr = PetscFree(l->unplacedarray);CHKERRQ(ierr);} 14246947451fSStefano Zampini ierr = VecDestroy(&l->cvec);CHKERRQ(ierr); 1425bf0cc555SLisandro Dalcin ierr = PetscFree(mat->data);CHKERRQ(ierr); 1426dbd8c25aSHong Zhang 1427dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)mat,0);CHKERRQ(ierr); 142849a6ff4bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetLDA_C",NULL);CHKERRQ(ierr); 1429bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetArray_C",NULL);CHKERRQ(ierr); 143052c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreArray_C",NULL);CHKERRQ(ierr); 1431d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDensePlaceArray_C",NULL);CHKERRQ(ierr); 1432d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseResetArray_C",NULL);CHKERRQ(ierr); 1433d5ea218eSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseReplaceArray_C",NULL);CHKERRQ(ierr); 143452c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetArrayRead_C",NULL);CHKERRQ(ierr); 143552c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreArrayRead_C",NULL);CHKERRQ(ierr); 14366947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetArrayWrite_C",NULL);CHKERRQ(ierr); 14376947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreArrayWrite_C",NULL);CHKERRQ(ierr); 14388baccfbdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatConvert_seqdense_seqaij_C",NULL);CHKERRQ(ierr); 14398baccfbdSHong Zhang 
#if defined(PETSC_HAVE_ELEMENTAL) 14408baccfbdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatConvert_seqdense_elemental_C",NULL);CHKERRQ(ierr); 14418baccfbdSHong Zhang #endif 14422bf066beSStefano Zampini #if defined(PETSC_HAVE_CUDA) 14432bf066beSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatConvert_seqdense_seqdensecuda_C",NULL);CHKERRQ(ierr); 14444222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqdensecuda_seqdensecuda_C",NULL);CHKERRQ(ierr); 14454222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqdensecuda_seqdense_C",NULL);CHKERRQ(ierr); 14464222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqaijcusparse_seqdense_C",NULL);CHKERRQ(ierr); 14472bf066beSStefano Zampini #endif 1448bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatSeqDenseSetPreallocation_C",NULL);CHKERRQ(ierr); 14494222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 14504222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqdense_seqdense_C",NULL);CHKERRQ(ierr); 1451bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 1452bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 14534222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqbaij_seqdense_C",NULL);CHKERRQ(ierr); 1454a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqbaij_seqdense_C",NULL);CHKERRQ(ierr); 1455a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqbaij_seqdense_C",NULL);CHKERRQ(ierr); 14564222ddf1SHong 
Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatProductSetFromOptions_seqsbaij_seqdense_C",NULL);CHKERRQ(ierr); 1457c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqsbaij_seqdense_C",NULL);CHKERRQ(ierr); 1458c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqsbaij_seqdense_C",NULL);CHKERRQ(ierr); 145952c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 146052c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 146152c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 146252c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 146352c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 146452c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 146552c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultSymbolic_nest_seqdense_C",NULL);CHKERRQ(ierr); 146652c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatMatMultNumeric_nest_seqdense_C",NULL);CHKERRQ(ierr); 146752c5f739Sprj- 14683bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultSymbolic_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 14693bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultNumeric_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 147052c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultSymbolic_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 147152c5f739Sprj- ierr = 
PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultNumeric_seqaijperm_seqdense_C",NULL);CHKERRQ(ierr); 147252c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultSymbolic_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 147352c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultNumeric_seqaijsell_seqdense_C",NULL);CHKERRQ(ierr); 147452c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultSymbolic_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 147552c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)mat,"MatTransposeMatMultNumeric_seqaijmkl_seqdense_C",NULL);CHKERRQ(ierr); 147686aefd0dSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumn_C",NULL);CHKERRQ(ierr); 147786aefd0dSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumn_C",NULL);CHKERRQ(ierr); 14786947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumnVec_C",NULL);CHKERRQ(ierr); 14796947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumnVec_C",NULL);CHKERRQ(ierr); 14806947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumnVecRead_C",NULL);CHKERRQ(ierr); 14816947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumnVecRead_C",NULL);CHKERRQ(ierr); 14826947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseGetColumnVecWrite_C",NULL);CHKERRQ(ierr); 14836947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)mat,"MatDenseRestoreColumnVecWrite_C",NULL);CHKERRQ(ierr); 14843a40ed3dSBarry Smith PetscFunctionReturn(0); 1485289bc588SBarry Smith } 1486289bc588SBarry Smith 1487e0877f53SBarry Smith static PetscErrorCode MatTranspose_SeqDense(Mat A,MatReuse reuse,Mat *matout) 1488289bc588SBarry Smith { 1489c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = 
(Mat_SeqDense*)A->data; 14906849ba73SBarry Smith PetscErrorCode ierr; 149113f74950SBarry Smith PetscInt k,j,m,n,M; 149287828ca2SBarry Smith PetscScalar *v,tmp; 149348b35521SBarry Smith 14943a40ed3dSBarry Smith PetscFunctionBegin; 1495ca15aa20SStefano Zampini m = A->rmap->n; M = mat->lda; n = A->cmap->n; 14962847e3fdSStefano Zampini if (reuse == MAT_INPLACE_MATRIX && m == n) { /* in place transpose */ 1497ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 1498d3e5ee88SLois Curfman McInnes for (j=0; j<m; j++) { 1499289bc588SBarry Smith for (k=0; k<j; k++) { 15001b807ce4Svictorle tmp = v[j + k*M]; 15011b807ce4Svictorle v[j + k*M] = v[k + j*M]; 15021b807ce4Svictorle v[k + j*M] = tmp; 1503289bc588SBarry Smith } 1504289bc588SBarry Smith } 1505ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 15063a40ed3dSBarry Smith } else { /* out-of-place transpose */ 1507d3e5ee88SLois Curfman McInnes Mat tmat; 1508ec8511deSBarry Smith Mat_SeqDense *tmatd; 150987828ca2SBarry Smith PetscScalar *v2; 1510af36a384SStefano Zampini PetscInt M2; 1511ea709b57SSatish Balay 15122847e3fdSStefano Zampini if (reuse != MAT_REUSE_MATRIX) { 1513ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&tmat);CHKERRQ(ierr); 1514d0f46423SBarry Smith ierr = MatSetSizes(tmat,A->cmap->n,A->rmap->n,A->cmap->n,A->rmap->n);CHKERRQ(ierr); 15157adad957SLisandro Dalcin ierr = MatSetType(tmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 15160298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(tmat,NULL);CHKERRQ(ierr); 1517ca15aa20SStefano Zampini } else tmat = *matout; 1518ca15aa20SStefano Zampini 1519ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,(const PetscScalar**)&v);CHKERRQ(ierr); 1520ca15aa20SStefano Zampini ierr = MatDenseGetArray(tmat,&v2);CHKERRQ(ierr); 1521ec8511deSBarry Smith tmatd = (Mat_SeqDense*)tmat->data; 1522ca15aa20SStefano Zampini M2 = tmatd->lda; 1523d3e5ee88SLois Curfman McInnes for (j=0; j<n; j++) { 1524af36a384SStefano 
Zampini for (k=0; k<m; k++) v2[j + k*M2] = v[k + j*M]; 1525d3e5ee88SLois Curfman McInnes } 1526ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(tmat,&v2);CHKERRQ(ierr); 1527ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&v);CHKERRQ(ierr); 15286d4a8577SBarry Smith ierr = MatAssemblyBegin(tmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15296d4a8577SBarry Smith ierr = MatAssemblyEnd(tmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15302847e3fdSStefano Zampini if (reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX) *matout = tmat; 15312847e3fdSStefano Zampini else { 15322847e3fdSStefano Zampini ierr = MatHeaderMerge(A,&tmat);CHKERRQ(ierr); 15332847e3fdSStefano Zampini } 153448b35521SBarry Smith } 15353a40ed3dSBarry Smith PetscFunctionReturn(0); 1536289bc588SBarry Smith } 1537289bc588SBarry Smith 1538e0877f53SBarry Smith static PetscErrorCode MatEqual_SeqDense(Mat A1,Mat A2,PetscBool *flg) 1539289bc588SBarry Smith { 1540c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat1 = (Mat_SeqDense*)A1->data; 1541c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat2 = (Mat_SeqDense*)A2->data; 1542ca15aa20SStefano Zampini PetscInt i; 1543ca15aa20SStefano Zampini const PetscScalar *v1,*v2; 1544ca15aa20SStefano Zampini PetscErrorCode ierr; 15459ea5d5aeSSatish Balay 15463a40ed3dSBarry Smith PetscFunctionBegin; 1547d0f46423SBarry Smith if (A1->rmap->n != A2->rmap->n) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 1548d0f46423SBarry Smith if (A1->cmap->n != A2->cmap->n) {*flg = PETSC_FALSE; PetscFunctionReturn(0);} 1549ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A1,&v1);CHKERRQ(ierr); 1550ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A2,&v2);CHKERRQ(ierr); 1551ca15aa20SStefano Zampini for (i=0; i<A1->cmap->n; i++) { 1552ca15aa20SStefano Zampini ierr = PetscArraycmp(v1,v2,A1->rmap->n,flg);CHKERRQ(ierr); 1553ca15aa20SStefano Zampini if (*flg == PETSC_FALSE) PetscFunctionReturn(0); 1554ca15aa20SStefano Zampini v1 += mat1->lda; 1555ca15aa20SStefano Zampini v2 
+= mat2->lda; 15561b807ce4Svictorle } 1557ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A1,&v1);CHKERRQ(ierr); 1558ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A2,&v2);CHKERRQ(ierr); 155977c4ece6SBarry Smith *flg = PETSC_TRUE; 15603a40ed3dSBarry Smith PetscFunctionReturn(0); 1561289bc588SBarry Smith } 1562289bc588SBarry Smith 1563e0877f53SBarry Smith static PetscErrorCode MatGetDiagonal_SeqDense(Mat A,Vec v) 1564289bc588SBarry Smith { 1565c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 156613f74950SBarry Smith PetscInt i,n,len; 1567ca15aa20SStefano Zampini PetscScalar *x; 1568ca15aa20SStefano Zampini const PetscScalar *vv; 1569ca15aa20SStefano Zampini PetscErrorCode ierr; 157044cd7ae7SLois Curfman McInnes 15713a40ed3dSBarry Smith PetscFunctionBegin; 15727a97a34bSBarry Smith ierr = VecGetSize(v,&n);CHKERRQ(ierr); 15731ebc52fbSHong Zhang ierr = VecGetArray(v,&x);CHKERRQ(ierr); 1574d0f46423SBarry Smith len = PetscMin(A->rmap->n,A->cmap->n); 1575ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&vv);CHKERRQ(ierr); 1576e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming mat and vec"); 157744cd7ae7SLois Curfman McInnes for (i=0; i<len; i++) { 1578ca15aa20SStefano Zampini x[i] = vv[i*mat->lda + i]; 1579289bc588SBarry Smith } 1580ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&vv);CHKERRQ(ierr); 15811ebc52fbSHong Zhang ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 15823a40ed3dSBarry Smith PetscFunctionReturn(0); 1583289bc588SBarry Smith } 1584289bc588SBarry Smith 1585e0877f53SBarry Smith static PetscErrorCode MatDiagonalScale_SeqDense(Mat A,Vec ll,Vec rr) 1586289bc588SBarry Smith { 1587c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1588f1ceaac6SMatthew G. 
Knepley const PetscScalar *l,*r; 1589ca15aa20SStefano Zampini PetscScalar x,*v,*vv; 1590dfbe8321SBarry Smith PetscErrorCode ierr; 1591d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n; 159255659b69SBarry Smith 15933a40ed3dSBarry Smith PetscFunctionBegin; 1594ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&vv);CHKERRQ(ierr); 159528988994SBarry Smith if (ll) { 15967a97a34bSBarry Smith ierr = VecGetSize(ll,&m);CHKERRQ(ierr); 1597f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(ll,&l);CHKERRQ(ierr); 1598e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vec wrong size"); 1599da3a660dSBarry Smith for (i=0; i<m; i++) { 1600da3a660dSBarry Smith x = l[i]; 1601ca15aa20SStefano Zampini v = vv + i; 1602b43bac26SStefano Zampini for (j=0; j<n; j++) { (*v) *= x; v+= mat->lda;} 1603da3a660dSBarry Smith } 1604f1ceaac6SMatthew G. Knepley ierr = VecRestoreArrayRead(ll,&l);CHKERRQ(ierr); 1605eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*n*m);CHKERRQ(ierr); 1606da3a660dSBarry Smith } 160728988994SBarry Smith if (rr) { 16087a97a34bSBarry Smith ierr = VecGetSize(rr,&n);CHKERRQ(ierr); 1609f1ceaac6SMatthew G. Knepley ierr = VecGetArrayRead(rr,&r);CHKERRQ(ierr); 1610e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vec wrong size"); 1611da3a660dSBarry Smith for (i=0; i<n; i++) { 1612da3a660dSBarry Smith x = r[i]; 1613ca15aa20SStefano Zampini v = vv + i*mat->lda; 16142205254eSKarl Rupp for (j=0; j<m; j++) (*v++) *= x; 1615da3a660dSBarry Smith } 1616f1ceaac6SMatthew G. 
Knepley ierr = VecRestoreArrayRead(rr,&r);CHKERRQ(ierr); 1617eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*n*m);CHKERRQ(ierr); 1618da3a660dSBarry Smith } 1619ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&vv);CHKERRQ(ierr); 16203a40ed3dSBarry Smith PetscFunctionReturn(0); 1621289bc588SBarry Smith } 1622289bc588SBarry Smith 1623ca15aa20SStefano Zampini PetscErrorCode MatNorm_SeqDense(Mat A,NormType type,PetscReal *nrm) 1624289bc588SBarry Smith { 1625c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 1626ca15aa20SStefano Zampini PetscScalar *v,*vv; 1627329f5518SBarry Smith PetscReal sum = 0.0; 1628d0f46423SBarry Smith PetscInt lda =mat->lda,m=A->rmap->n,i,j; 1629efee365bSSatish Balay PetscErrorCode ierr; 163055659b69SBarry Smith 16313a40ed3dSBarry Smith PetscFunctionBegin; 1632ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,(const PetscScalar**)&vv);CHKERRQ(ierr); 1633ca15aa20SStefano Zampini v = vv; 1634289bc588SBarry Smith if (type == NORM_FROBENIUS) { 1635a5ce6ee0Svictorle if (lda>m) { 1636d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1637ca15aa20SStefano Zampini v = vv+j*lda; 1638a5ce6ee0Svictorle for (i=0; i<m; i++) { 1639a5ce6ee0Svictorle sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 1640a5ce6ee0Svictorle } 1641a5ce6ee0Svictorle } 1642a5ce6ee0Svictorle } else { 1643570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 1644570b7f6dSBarry Smith PetscBLASInt one = 1,cnt = A->cmap->n*A->rmap->n; 1645570b7f6dSBarry Smith *nrm = BLASnrm2_(&cnt,v,&one); 1646570b7f6dSBarry Smith } 1647570b7f6dSBarry Smith #else 1648d0f46423SBarry Smith for (i=0; i<A->cmap->n*A->rmap->n; i++) { 1649329f5518SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 1650289bc588SBarry Smith } 1651a5ce6ee0Svictorle } 16528f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 1653570b7f6dSBarry Smith #endif 1654dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 16553a40ed3dSBarry Smith } else if (type == NORM_1) { 
1656064f8208SBarry Smith *nrm = 0.0; 1657d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1658ca15aa20SStefano Zampini v = vv + j*mat->lda; 1659289bc588SBarry Smith sum = 0.0; 1660d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 166133a8263dSBarry Smith sum += PetscAbsScalar(*v); v++; 1662289bc588SBarry Smith } 1663064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 1664289bc588SBarry Smith } 1665eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 16663a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 1667064f8208SBarry Smith *nrm = 0.0; 1668d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 1669ca15aa20SStefano Zampini v = vv + j; 1670289bc588SBarry Smith sum = 0.0; 1671d0f46423SBarry Smith for (i=0; i<A->cmap->n; i++) { 16721b807ce4Svictorle sum += PetscAbsScalar(*v); v += mat->lda; 1673289bc588SBarry Smith } 1674064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 1675289bc588SBarry Smith } 1676eb3f19e4SBarry Smith ierr = PetscLogFlops(1.0*A->cmap->n*A->rmap->n);CHKERRQ(ierr); 1677e7e72b3dSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No two norm"); 1678ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,(const PetscScalar**)&vv);CHKERRQ(ierr); 16793a40ed3dSBarry Smith PetscFunctionReturn(0); 1680289bc588SBarry Smith } 1681289bc588SBarry Smith 1682e0877f53SBarry Smith static PetscErrorCode MatSetOption_SeqDense(Mat A,MatOption op,PetscBool flg) 1683289bc588SBarry Smith { 1684c0bbcb79SLois Curfman McInnes Mat_SeqDense *aij = (Mat_SeqDense*)A->data; 168563ba0a88SBarry Smith PetscErrorCode ierr; 168667e560aaSBarry Smith 16873a40ed3dSBarry Smith PetscFunctionBegin; 1688b5a2b587SKris Buschelman switch (op) { 1689b5a2b587SKris Buschelman case MAT_ROW_ORIENTED: 16904e0d8c25SBarry Smith aij->roworiented = flg; 1691b5a2b587SKris Buschelman break; 1692512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1693b5a2b587SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 16943971808eSMatthew Knepley case 
MAT_NEW_NONZERO_ALLOCATION_ERR: 16954e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 169613fa8e87SLisandro Dalcin case MAT_KEEP_NONZERO_PATTERN: 1697b5a2b587SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1698b5a2b587SKris Buschelman case MAT_USE_HASH_TABLE: 16990f8fb01aSBarry Smith case MAT_IGNORE_ZERO_ENTRIES: 17005021d80fSJed Brown case MAT_IGNORE_LOWER_TRIANGULAR: 1701071fcb05SBarry Smith case MAT_SORTED_FULL: 17025021d80fSJed Brown ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 17035021d80fSJed Brown break; 17045021d80fSJed Brown case MAT_SPD: 170577e54ba9SKris Buschelman case MAT_SYMMETRIC: 170677e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 17079a4540c5SBarry Smith case MAT_HERMITIAN: 17089a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 17095021d80fSJed Brown /* These options are handled directly by MatSetOption() */ 171077e54ba9SKris Buschelman break; 1711b5a2b587SKris Buschelman default: 1712e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %s",MatOptions[op]); 17133a40ed3dSBarry Smith } 17143a40ed3dSBarry Smith PetscFunctionReturn(0); 1715289bc588SBarry Smith } 1716289bc588SBarry Smith 1717e0877f53SBarry Smith static PetscErrorCode MatZeroEntries_SeqDense(Mat A) 17186f0a148fSBarry Smith { 1719ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)A->data; 17206849ba73SBarry Smith PetscErrorCode ierr; 1721d0f46423SBarry Smith PetscInt lda=l->lda,m=A->rmap->n,j; 1722ca15aa20SStefano Zampini PetscScalar *v; 17233a40ed3dSBarry Smith 17243a40ed3dSBarry Smith PetscFunctionBegin; 1725ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 1726a5ce6ee0Svictorle if (lda>m) { 1727d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 1728ca15aa20SStefano Zampini ierr = PetscArrayzero(v+j*lda,m);CHKERRQ(ierr); 1729a5ce6ee0Svictorle } 1730a5ce6ee0Svictorle } else { 1731ca15aa20SStefano Zampini ierr = PetscArrayzero(v,A->rmap->n*A->cmap->n);CHKERRQ(ierr); 1732a5ce6ee0Svictorle } 1733ca15aa20SStefano 
Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 17343a40ed3dSBarry Smith PetscFunctionReturn(0); 17356f0a148fSBarry Smith } 17366f0a148fSBarry Smith 1737e0877f53SBarry Smith static PetscErrorCode MatZeroRows_SeqDense(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 17386f0a148fSBarry Smith { 173997b48c8fSBarry Smith PetscErrorCode ierr; 1740ec8511deSBarry Smith Mat_SeqDense *l = (Mat_SeqDense*)A->data; 1741b9679d65SBarry Smith PetscInt m = l->lda, n = A->cmap->n, i,j; 1742ca15aa20SStefano Zampini PetscScalar *slot,*bb,*v; 174397b48c8fSBarry Smith const PetscScalar *xx; 174455659b69SBarry Smith 17453a40ed3dSBarry Smith PetscFunctionBegin; 174676bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 1747b9679d65SBarry Smith for (i=0; i<N; i++) { 1748b9679d65SBarry Smith if (rows[i] < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row requested to be zeroed"); 1749b9679d65SBarry Smith if (rows[i] >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D requested to be zeroed greater than or equal number of rows %D",rows[i],A->rmap->n); 1750b9679d65SBarry Smith } 175176bd3646SJed Brown } 1752ca15aa20SStefano Zampini if (!N) PetscFunctionReturn(0); 1753b9679d65SBarry Smith 175497b48c8fSBarry Smith /* fix right hand side if needed */ 175597b48c8fSBarry Smith if (x && b) { 175697b48c8fSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 175797b48c8fSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 17582205254eSKarl Rupp for (i=0; i<N; i++) bb[rows[i]] = diag*xx[rows[i]]; 175997b48c8fSBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 176097b48c8fSBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 176197b48c8fSBarry Smith } 176297b48c8fSBarry Smith 1763ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 17646f0a148fSBarry Smith for (i=0; i<N; i++) { 1765ca15aa20SStefano Zampini slot = v + rows[i]; 1766b9679d65SBarry Smith for (j=0; j<n; j++) { *slot = 0.0; slot += m;} 
17676f0a148fSBarry Smith } 1768f4df32b1SMatthew Knepley if (diag != 0.0) { 1769b9679d65SBarry Smith if (A->rmap->n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only coded for square matrices"); 17706f0a148fSBarry Smith for (i=0; i<N; i++) { 1771ca15aa20SStefano Zampini slot = v + (m+1)*rows[i]; 1772f4df32b1SMatthew Knepley *slot = diag; 17736f0a148fSBarry Smith } 17746f0a148fSBarry Smith } 1775ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 17763a40ed3dSBarry Smith PetscFunctionReturn(0); 17776f0a148fSBarry Smith } 1778557bce09SLois Curfman McInnes 177949a6ff4bSBarry Smith static PetscErrorCode MatDenseGetLDA_SeqDense(Mat A,PetscInt *lda) 178049a6ff4bSBarry Smith { 178149a6ff4bSBarry Smith Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 178249a6ff4bSBarry Smith 178349a6ff4bSBarry Smith PetscFunctionBegin; 178449a6ff4bSBarry Smith *lda = mat->lda; 178549a6ff4bSBarry Smith PetscFunctionReturn(0); 178649a6ff4bSBarry Smith } 178749a6ff4bSBarry Smith 1788637a0070SStefano Zampini PetscErrorCode MatDenseGetArray_SeqDense(Mat A,PetscScalar **array) 178964e87e97SBarry Smith { 1790c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 17913a40ed3dSBarry Smith 17923a40ed3dSBarry Smith PetscFunctionBegin; 179364e87e97SBarry Smith *array = mat->v; 17943a40ed3dSBarry Smith PetscFunctionReturn(0); 179564e87e97SBarry Smith } 17960754003eSLois Curfman McInnes 1797637a0070SStefano Zampini PetscErrorCode MatDenseRestoreArray_SeqDense(Mat A,PetscScalar **array) 1798ff14e315SSatish Balay { 17993a40ed3dSBarry Smith PetscFunctionBegin; 1800637a0070SStefano Zampini *array = NULL; 18013a40ed3dSBarry Smith PetscFunctionReturn(0); 1802ff14e315SSatish Balay } 18030754003eSLois Curfman McInnes 1804dec5eb66SMatthew G Knepley /*@C 180549a6ff4bSBarry Smith MatDenseGetLDA - gets the leading dimension of the array returned from MatDenseGetArray() 180649a6ff4bSBarry Smith 180749a6ff4bSBarry Smith Logically Collective on Mat 180849a6ff4bSBarry Smith 
180949a6ff4bSBarry Smith Input Parameter: 181049a6ff4bSBarry Smith . mat - a MATSEQDENSE or MATMPIDENSE matrix 181149a6ff4bSBarry Smith 181249a6ff4bSBarry Smith Output Parameter: 181349a6ff4bSBarry Smith . lda - the leading dimension 181449a6ff4bSBarry Smith 181549a6ff4bSBarry Smith Level: intermediate 181649a6ff4bSBarry Smith 181749a6ff4bSBarry Smith .seealso: MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead(), MatSeqDenseSetLDA() 181849a6ff4bSBarry Smith @*/ 181949a6ff4bSBarry Smith PetscErrorCode MatDenseGetLDA(Mat A,PetscInt *lda) 182049a6ff4bSBarry Smith { 182149a6ff4bSBarry Smith PetscErrorCode ierr; 182249a6ff4bSBarry Smith 182349a6ff4bSBarry Smith PetscFunctionBegin; 1824d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1825d5ea218eSStefano Zampini PetscValidPointer(lda,2); 182649a6ff4bSBarry Smith ierr = PetscUseMethod(A,"MatDenseGetLDA_C",(Mat,PetscInt*),(A,lda));CHKERRQ(ierr); 182749a6ff4bSBarry Smith PetscFunctionReturn(0); 182849a6ff4bSBarry Smith } 182949a6ff4bSBarry Smith 183049a6ff4bSBarry Smith /*@C 18316947451fSStefano Zampini MatDenseGetArray - gives read-write access to the array where the data for a dense matrix is stored 183273a71a0fSBarry Smith 18338572280aSBarry Smith Logically Collective on Mat 183473a71a0fSBarry Smith 183573a71a0fSBarry Smith Input Parameter: 18366947451fSStefano Zampini . mat - a dense matrix 183773a71a0fSBarry Smith 183873a71a0fSBarry Smith Output Parameter: 183973a71a0fSBarry Smith . 
array - pointer to the data 184073a71a0fSBarry Smith 184173a71a0fSBarry Smith Level: intermediate 184273a71a0fSBarry Smith 18436947451fSStefano Zampini .seealso: MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead(), MatDenseGetArrayWrite(), MatDenseRestoreArrayWrite() 184473a71a0fSBarry Smith @*/ 18458c778c55SBarry Smith PetscErrorCode MatDenseGetArray(Mat A,PetscScalar **array) 184673a71a0fSBarry Smith { 184773a71a0fSBarry Smith PetscErrorCode ierr; 184873a71a0fSBarry Smith 184973a71a0fSBarry Smith PetscFunctionBegin; 1850d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1851d5ea218eSStefano Zampini PetscValidPointer(array,2); 18528c778c55SBarry Smith ierr = PetscUseMethod(A,"MatDenseGetArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 185373a71a0fSBarry Smith PetscFunctionReturn(0); 185473a71a0fSBarry Smith } 185573a71a0fSBarry Smith 1856dec5eb66SMatthew G Knepley /*@C 1857579dbff0SBarry Smith MatDenseRestoreArray - returns access to the array where the data for a dense matrix is stored obtained by MatDenseGetArray() 185873a71a0fSBarry Smith 18598572280aSBarry Smith Logically Collective on Mat 18608572280aSBarry Smith 18618572280aSBarry Smith Input Parameters: 18626947451fSStefano Zampini + mat - a dense matrix 1863a2b725a8SWilliam Gropp - array - pointer to the data 18648572280aSBarry Smith 18658572280aSBarry Smith Level: intermediate 18668572280aSBarry Smith 18676947451fSStefano Zampini .seealso: MatDenseGetArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead(), MatDenseGetArrayWrite(), MatDenseRestoreArrayWrite() 18688572280aSBarry Smith @*/ 18698572280aSBarry Smith PetscErrorCode MatDenseRestoreArray(Mat A,PetscScalar **array) 18708572280aSBarry Smith { 18718572280aSBarry Smith PetscErrorCode ierr; 18728572280aSBarry Smith 18738572280aSBarry Smith PetscFunctionBegin; 1874d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1875d5ea218eSStefano Zampini PetscValidPointer(array,2); 
18768572280aSBarry Smith ierr = PetscUseMethod(A,"MatDenseRestoreArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 18778572280aSBarry Smith ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr); 1878637a0070SStefano Zampini #if defined(PETSC_HAVE_CUDA) 1879637a0070SStefano Zampini A->offloadmask = PETSC_OFFLOAD_CPU; 1880637a0070SStefano Zampini #endif 18818572280aSBarry Smith PetscFunctionReturn(0); 18828572280aSBarry Smith } 18838572280aSBarry Smith 18848572280aSBarry Smith /*@C 18856947451fSStefano Zampini MatDenseGetArrayRead - gives read-only access to the array where the data for a dense matrix is stored 18868572280aSBarry Smith 18878572280aSBarry Smith Not Collective 18888572280aSBarry Smith 18898572280aSBarry Smith Input Parameter: 18906947451fSStefano Zampini . mat - a dense matrix 18918572280aSBarry Smith 18928572280aSBarry Smith Output Parameter: 18938572280aSBarry Smith . array - pointer to the data 18948572280aSBarry Smith 18958572280aSBarry Smith Level: intermediate 18968572280aSBarry Smith 18976947451fSStefano Zampini .seealso: MatDenseRestoreArrayRead(), MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayWrite(), MatDenseRestoreArrayWrite() 18988572280aSBarry Smith @*/ 18998572280aSBarry Smith PetscErrorCode MatDenseGetArrayRead(Mat A,const PetscScalar **array) 19008572280aSBarry Smith { 19018572280aSBarry Smith PetscErrorCode ierr; 19028572280aSBarry Smith 19038572280aSBarry Smith PetscFunctionBegin; 1904d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1905d5ea218eSStefano Zampini PetscValidPointer(array,2); 19068572280aSBarry Smith ierr = PetscUseMethod(A,"MatDenseGetArrayRead_C",(Mat,const PetscScalar**),(A,array));CHKERRQ(ierr); 19078572280aSBarry Smith PetscFunctionReturn(0); 19088572280aSBarry Smith } 19098572280aSBarry Smith 19108572280aSBarry Smith /*@C 19116947451fSStefano Zampini MatDenseRestoreArrayRead - returns access to the array where the data for a dense matrix is stored obtained by 
MatDenseGetArrayRead() 19128572280aSBarry Smith 191373a71a0fSBarry Smith Not Collective 191473a71a0fSBarry Smith 191573a71a0fSBarry Smith Input Parameters: 19166947451fSStefano Zampini + mat - a dense matrix 1917a2b725a8SWilliam Gropp - array - pointer to the data 191873a71a0fSBarry Smith 191973a71a0fSBarry Smith Level: intermediate 192073a71a0fSBarry Smith 19216947451fSStefano Zampini .seealso: MatDenseGetArrayRead(), MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayWrite(), MatDenseRestoreArrayWrite() 192273a71a0fSBarry Smith @*/ 19238572280aSBarry Smith PetscErrorCode MatDenseRestoreArrayRead(Mat A,const PetscScalar **array) 192473a71a0fSBarry Smith { 192573a71a0fSBarry Smith PetscErrorCode ierr; 192673a71a0fSBarry Smith 192773a71a0fSBarry Smith PetscFunctionBegin; 1928d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1929d5ea218eSStefano Zampini PetscValidPointer(array,2); 19308572280aSBarry Smith ierr = PetscUseMethod(A,"MatDenseRestoreArrayRead_C",(Mat,const PetscScalar**),(A,array));CHKERRQ(ierr); 193173a71a0fSBarry Smith PetscFunctionReturn(0); 193273a71a0fSBarry Smith } 193373a71a0fSBarry Smith 19346947451fSStefano Zampini /*@C 19356947451fSStefano Zampini MatDenseGetArrayWrite - gives write-only access to the array where the data for a dense matrix is stored 19366947451fSStefano Zampini 19376947451fSStefano Zampini Not Collective 19386947451fSStefano Zampini 19396947451fSStefano Zampini Input Parameter: 19406947451fSStefano Zampini . mat - a dense matrix 19416947451fSStefano Zampini 19426947451fSStefano Zampini Output Parameter: 19436947451fSStefano Zampini . 
array - pointer to the data 19446947451fSStefano Zampini 19456947451fSStefano Zampini Level: intermediate 19466947451fSStefano Zampini 19476947451fSStefano Zampini .seealso: MatDenseRestoreArrayWrite(), MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead() 19486947451fSStefano Zampini @*/ 19496947451fSStefano Zampini PetscErrorCode MatDenseGetArrayWrite(Mat A,PetscScalar **array) 19506947451fSStefano Zampini { 19516947451fSStefano Zampini PetscErrorCode ierr; 19526947451fSStefano Zampini 19536947451fSStefano Zampini PetscFunctionBegin; 1954d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1955d5ea218eSStefano Zampini PetscValidPointer(array,2); 19566947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseGetArrayWrite_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 19576947451fSStefano Zampini PetscFunctionReturn(0); 19586947451fSStefano Zampini } 19596947451fSStefano Zampini 19606947451fSStefano Zampini /*@C 19616947451fSStefano Zampini MatDenseRestoreArrayWrite - returns access to the array where the data for a dense matrix is stored obtained by MatDenseGetArrayWrite() 19626947451fSStefano Zampini 19636947451fSStefano Zampini Not Collective 19646947451fSStefano Zampini 19656947451fSStefano Zampini Input Parameters: 19666947451fSStefano Zampini + mat - a dense matrix 19676947451fSStefano Zampini - array - pointer to the data 19686947451fSStefano Zampini 19696947451fSStefano Zampini Level: intermediate 19706947451fSStefano Zampini 19716947451fSStefano Zampini .seealso: MatDenseGetArrayWrite(), MatDenseGetArray(), MatDenseRestoreArray(), MatDenseGetArrayRead(), MatDenseRestoreArrayRead() 19726947451fSStefano Zampini @*/ 19736947451fSStefano Zampini PetscErrorCode MatDenseRestoreArrayWrite(Mat A,PetscScalar **array) 19746947451fSStefano Zampini { 19756947451fSStefano Zampini PetscErrorCode ierr; 19766947451fSStefano Zampini 19776947451fSStefano Zampini PetscFunctionBegin; 1978d5ea218eSStefano Zampini 
PetscValidHeaderSpecific(A,MAT_CLASSID,1); 1979d5ea218eSStefano Zampini PetscValidPointer(array,2); 19806947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseRestoreArrayWrite_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 19816947451fSStefano Zampini ierr = PetscObjectStateIncrease((PetscObject)A);CHKERRQ(ierr); 19826947451fSStefano Zampini #if defined(PETSC_HAVE_CUDA) 19836947451fSStefano Zampini A->offloadmask = PETSC_OFFLOAD_CPU; 19846947451fSStefano Zampini #endif 19856947451fSStefano Zampini PetscFunctionReturn(0); 19866947451fSStefano Zampini } 19876947451fSStefano Zampini 19887dae84e0SHong Zhang static PetscErrorCode MatCreateSubMatrix_SeqDense(Mat A,IS isrow,IS iscol,PetscInt cs,MatReuse scall,Mat *B) 19890754003eSLois Curfman McInnes { 1990c0bbcb79SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)A->data; 19916849ba73SBarry Smith PetscErrorCode ierr; 1992ca15aa20SStefano Zampini PetscInt i,j,nrows,ncols,blda; 19935d0c19d7SBarry Smith const PetscInt *irow,*icol; 199487828ca2SBarry Smith PetscScalar *av,*bv,*v = mat->v; 19950754003eSLois Curfman McInnes Mat newmat; 19960754003eSLois Curfman McInnes 19973a40ed3dSBarry Smith PetscFunctionBegin; 199878b31e54SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 199978b31e54SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 2000e03a110bSBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 2001e03a110bSBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 20020754003eSLois Curfman McInnes 2003182d2002SSatish Balay /* Check submatrixcall */ 2004182d2002SSatish Balay if (scall == MAT_REUSE_MATRIX) { 200513f74950SBarry Smith PetscInt n_cols,n_rows; 2006182d2002SSatish Balay ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 200721a2c019SBarry Smith if (n_rows != nrows || n_cols != ncols) { 2008f746d493SDmitry Karpeev /* resize the result matrix to match number of requested rows/columns */ 2009c61587bbSBarry Smith ierr = 
MatSetSizes(*B,nrows,ncols,nrows,ncols);CHKERRQ(ierr); 201021a2c019SBarry Smith } 2011182d2002SSatish Balay newmat = *B; 2012182d2002SSatish Balay } else { 20130754003eSLois Curfman McInnes /* Create and fill new matrix */ 2014ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&newmat);CHKERRQ(ierr); 2015f69a0ea3SMatthew Knepley ierr = MatSetSizes(newmat,nrows,ncols,nrows,ncols);CHKERRQ(ierr); 20167adad957SLisandro Dalcin ierr = MatSetType(newmat,((PetscObject)A)->type_name);CHKERRQ(ierr); 20170298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(newmat,NULL);CHKERRQ(ierr); 2018182d2002SSatish Balay } 2019182d2002SSatish Balay 2020182d2002SSatish Balay /* Now extract the data pointers and do the copy,column at a time */ 2021ca15aa20SStefano Zampini ierr = MatDenseGetArray(newmat,&bv);CHKERRQ(ierr); 2022ca15aa20SStefano Zampini ierr = MatDenseGetLDA(newmat,&blda);CHKERRQ(ierr); 2023182d2002SSatish Balay for (i=0; i<ncols; i++) { 20246de62eeeSBarry Smith av = v + mat->lda*icol[i]; 2025ca15aa20SStefano Zampini for (j=0; j<nrows; j++) bv[j] = av[irow[j]]; 2026ca15aa20SStefano Zampini bv += blda; 20270754003eSLois Curfman McInnes } 2028ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(newmat,&bv);CHKERRQ(ierr); 2029182d2002SSatish Balay 2030182d2002SSatish Balay /* Assemble the matrices so that the correct flags are set */ 20316d4a8577SBarry Smith ierr = MatAssemblyBegin(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20326d4a8577SBarry Smith ierr = MatAssemblyEnd(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20330754003eSLois Curfman McInnes 20340754003eSLois Curfman McInnes /* Free work space */ 203578b31e54SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 203678b31e54SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 2037182d2002SSatish Balay *B = newmat; 20383a40ed3dSBarry Smith PetscFunctionReturn(0); 20390754003eSLois Curfman McInnes } 20400754003eSLois Curfman McInnes 20417dae84e0SHong Zhang static PetscErrorCode 
MatCreateSubMatrices_SeqDense(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2042905e6a2fSBarry Smith { 20436849ba73SBarry Smith PetscErrorCode ierr; 204413f74950SBarry Smith PetscInt i; 2045905e6a2fSBarry Smith 20463a40ed3dSBarry Smith PetscFunctionBegin; 2047905e6a2fSBarry Smith if (scall == MAT_INITIAL_MATRIX) { 2048df750dc8SHong Zhang ierr = PetscCalloc1(n+1,B);CHKERRQ(ierr); 2049905e6a2fSBarry Smith } 2050905e6a2fSBarry Smith 2051905e6a2fSBarry Smith for (i=0; i<n; i++) { 20527dae84e0SHong Zhang ierr = MatCreateSubMatrix_SeqDense(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 2053905e6a2fSBarry Smith } 20543a40ed3dSBarry Smith PetscFunctionReturn(0); 2055905e6a2fSBarry Smith } 2056905e6a2fSBarry Smith 2057e0877f53SBarry Smith static PetscErrorCode MatAssemblyBegin_SeqDense(Mat mat,MatAssemblyType mode) 2058c0aa2d19SHong Zhang { 2059c0aa2d19SHong Zhang PetscFunctionBegin; 2060c0aa2d19SHong Zhang PetscFunctionReturn(0); 2061c0aa2d19SHong Zhang } 2062c0aa2d19SHong Zhang 2063e0877f53SBarry Smith static PetscErrorCode MatAssemblyEnd_SeqDense(Mat mat,MatAssemblyType mode) 2064c0aa2d19SHong Zhang { 2065c0aa2d19SHong Zhang PetscFunctionBegin; 2066c0aa2d19SHong Zhang PetscFunctionReturn(0); 2067c0aa2d19SHong Zhang } 2068c0aa2d19SHong Zhang 2069e0877f53SBarry Smith static PetscErrorCode MatCopy_SeqDense(Mat A,Mat B,MatStructure str) 20704b0e389bSBarry Smith { 20714b0e389bSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data,*b = (Mat_SeqDense*)B->data; 20726849ba73SBarry Smith PetscErrorCode ierr; 2073ca15aa20SStefano Zampini const PetscScalar *va; 2074ca15aa20SStefano Zampini PetscScalar *vb; 2075d0f46423SBarry Smith PetscInt lda1=a->lda,lda2=b->lda, m=A->rmap->n,n=A->cmap->n, j; 20763a40ed3dSBarry Smith 20773a40ed3dSBarry Smith PetscFunctionBegin; 207833f4a19fSKris Buschelman /* If the two matrices don't have the same copy implementation, they aren't compatible for fast copy. 
*/ 207933f4a19fSKris Buschelman if (A->ops->copy != B->ops->copy) { 2080cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 20813a40ed3dSBarry Smith PetscFunctionReturn(0); 20823a40ed3dSBarry Smith } 2083e32f2f54SBarry Smith if (m != B->rmap->n || n != B->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"size(B) != size(A)"); 2084ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&va);CHKERRQ(ierr); 2085ca15aa20SStefano Zampini ierr = MatDenseGetArray(B,&vb);CHKERRQ(ierr); 2086a5ce6ee0Svictorle if (lda1>m || lda2>m) { 20870dbb7854Svictorle for (j=0; j<n; j++) { 2088ca15aa20SStefano Zampini ierr = PetscArraycpy(vb+j*lda2,va+j*lda1,m);CHKERRQ(ierr); 2089a5ce6ee0Svictorle } 2090a5ce6ee0Svictorle } else { 2091ca15aa20SStefano Zampini ierr = PetscArraycpy(vb,va,A->rmap->n*A->cmap->n);CHKERRQ(ierr); 2092a5ce6ee0Svictorle } 2093ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(B,&vb);CHKERRQ(ierr); 2094ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&va);CHKERRQ(ierr); 2095ca15aa20SStefano Zampini ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2096ca15aa20SStefano Zampini ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2097273d9f13SBarry Smith PetscFunctionReturn(0); 2098273d9f13SBarry Smith } 2099273d9f13SBarry Smith 2100e0877f53SBarry Smith static PetscErrorCode MatSetUp_SeqDense(Mat A) 2101273d9f13SBarry Smith { 2102dfbe8321SBarry Smith PetscErrorCode ierr; 2103273d9f13SBarry Smith 2104273d9f13SBarry Smith PetscFunctionBegin; 210518992e5dSStefano Zampini ierr = PetscLayoutSetUp(A->rmap);CHKERRQ(ierr); 210618992e5dSStefano Zampini ierr = PetscLayoutSetUp(A->cmap);CHKERRQ(ierr); 210718992e5dSStefano Zampini if (!A->preallocated) { 2108273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(A,0);CHKERRQ(ierr); 210918992e5dSStefano Zampini } 21103a40ed3dSBarry Smith PetscFunctionReturn(0); 21114b0e389bSBarry Smith } 21124b0e389bSBarry Smith 2113ba337c44SJed Brown static PetscErrorCode MatConjugate_SeqDense(Mat A) 
2114ba337c44SJed Brown { 2115ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 2116ca15aa20SStefano Zampini PetscScalar *aa; 2117ca15aa20SStefano Zampini PetscErrorCode ierr; 2118ba337c44SJed Brown 2119ba337c44SJed Brown PetscFunctionBegin; 2120ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&aa);CHKERRQ(ierr); 2121ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscConj(aa[i]); 2122ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&aa);CHKERRQ(ierr); 2123ba337c44SJed Brown PetscFunctionReturn(0); 2124ba337c44SJed Brown } 2125ba337c44SJed Brown 2126ba337c44SJed Brown static PetscErrorCode MatRealPart_SeqDense(Mat A) 2127ba337c44SJed Brown { 2128ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 2129ca15aa20SStefano Zampini PetscScalar *aa; 2130ca15aa20SStefano Zampini PetscErrorCode ierr; 2131ba337c44SJed Brown 2132ba337c44SJed Brown PetscFunctionBegin; 2133ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&aa);CHKERRQ(ierr); 2134ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 2135ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&aa);CHKERRQ(ierr); 2136ba337c44SJed Brown PetscFunctionReturn(0); 2137ba337c44SJed Brown } 2138ba337c44SJed Brown 2139ba337c44SJed Brown static PetscErrorCode MatImaginaryPart_SeqDense(Mat A) 2140ba337c44SJed Brown { 2141ba337c44SJed Brown PetscInt i,nz = A->rmap->n*A->cmap->n; 2142ca15aa20SStefano Zampini PetscScalar *aa; 2143ca15aa20SStefano Zampini PetscErrorCode ierr; 2144ba337c44SJed Brown 2145ba337c44SJed Brown PetscFunctionBegin; 2146ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&aa);CHKERRQ(ierr); 2147ba337c44SJed Brown for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 2148ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&aa);CHKERRQ(ierr); 2149ba337c44SJed Brown PetscFunctionReturn(0); 2150ba337c44SJed Brown } 2151284134d9SBarry Smith 2152a9fe9ddaSSatish Balay /* ----------------------------------------------------------------*/ 21534222ddf1SHong Zhang 
/*
   MatMatMultSymbolic_SeqDense_SeqDense - Symbolic phase of C = A*B.

   Sets the local and global sizes of C to (local rows of A) x (local columns of B).
   When C is not already MATSEQDENSE or MATSEQDENSECUDA it is given the type of A
   if B has that same type, and MATDENSE otherwise. Finishes with MatSetUp(C).

   The fill argument is accepted but not read.
*/
PetscErrorCode MatMatMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat C)
{
  const PetscInt nrows = A->rmap->n;
  const PetscInt ncols = B->cmap->n;
  PetscBool      isdense;
  PetscErrorCode ierr;

  PetscFunctionBegin;
  ierr = MatSetSizes(C,nrows,ncols,nrows,ncols);CHKERRQ(ierr);
  ierr = PetscObjectTypeCompareAny((PetscObject)C,&isdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr);
  if (!isdense) {
    PetscBool sametype;

    /* C has no usable dense type yet: inherit the type of A when B shares it */
    ierr = PetscObjectTypeCompare((PetscObject)B,((PetscObject)A)->type_name,&sametype);CHKERRQ(ierr);
    if (sametype) {
      ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr);
    } else {
      ierr = MatSetType(C,MATDENSE);CHKERRQ(ierr);
    }
  }
  ierr = MatSetUp(C);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*
   MatMatMultNumeric_SeqDense_SeqDense - Numeric phase of C = A*B.

   If A is MATSEQAIJ, MATSEQBAIJ, MATSEQSBAIJ or MATNEST, the matching
   MatMatMultNumeric_XXX routine is stored in C->ops->matmultnumeric and
   called in place of the dense kernel.

   Otherwise the product is computed with a single BLAS gemm call using the
   leading dimensions stored in the Mat_SeqDense data of A, B and C.
   Nothing is computed (and C is not modified) when the local row count of C,
   the local column count of C, or the local column count of A is zero.
*/
PetscErrorCode MatMatMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C)
{
  Mat_SeqDense      *adense,*bdense,*cdense;
  PetscErrorCode    (*kernel)(Mat,Mat,Mat) = NULL;
  PetscBLASInt      nrows,ncols,inner;
  const PetscScalar *aarr,*barr;
  PetscScalar       *carr;
  PetscScalar       one = 1.0,zero = 0.0;
  PetscBool         match;
  PetscErrorCode    ierr;

  PetscFunctionBegin;
  /* Handle the case where the user provided the final C matrix rather than calling MatMatMult() with MAT_INITIAL_MATRIX */
  ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&match);CHKERRQ(ierr);
  if (match) {
    kernel = MatMatMultNumeric_SeqAIJ_SeqDense;
  }
  ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&match);CHKERRQ(ierr);
  if (match) {
    kernel = MatMatMultNumeric_SeqBAIJ_SeqDense;
  }
  ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&match);CHKERRQ(ierr);
  if (match) {
    kernel = MatMatMultNumeric_SeqSBAIJ_SeqDense;
  }
  ierr = PetscObjectTypeCompare((PetscObject)A,MATNEST,&match);CHKERRQ(ierr);
  if (match) {
    kernel = MatMatMultNumeric_Nest_Dense;
  }
  if (kernel) {
    /* remember the specialised routine on C, then delegate to it */
    C->ops->matmultnumeric = kernel;
    ierr = (*kernel)(A,B,C);CHKERRQ(ierr);
    PetscFunctionReturn(0);
  }

  /* dense * dense: the data pointers are only interpreted as Mat_SeqDense on this path */
  adense = (Mat_SeqDense*)A->data;
  bdense = (Mat_SeqDense*)B->data;
  cdense = (Mat_SeqDense*)C->data;

  ierr = PetscBLASIntCast(C->rmap->n,&nrows);CHKERRQ(ierr);
  ierr = PetscBLASIntCast(C->cmap->n,&ncols);CHKERRQ(ierr);
  ierr = PetscBLASIntCast(A->cmap->n,&inner);CHKERRQ(ierr);
  if (nrows == 0 || ncols == 0 || inner == 0) PetscFunctionReturn(0);

  ierr = MatDenseGetArrayRead(A,&aarr);CHKERRQ(ierr);
  ierr = MatDenseGetArrayRead(B,&barr);CHKERRQ(ierr);
  ierr = MatDenseGetArray(C,&carr);CHKERRQ(ierr);
  /* C = 1*A*B + 0*C, no transposes */
  PetscStackCallBLAS("BLASgemm",BLASgemm_("N","N",&nrows,&ncols,&inner,&one,aarr,&adense->lda,barr,&bdense->lda,&zero,carr,&cdense->lda));
  /* inner multiplications and inner-1 additions per entry of C */
  ierr = PetscLogFlops(1.0*nrows*ncols*inner + 1.0*nrows*ncols*(inner-1));CHKERRQ(ierr);
  ierr = MatDenseRestoreArrayRead(A,&aarr);CHKERRQ(ierr);
  ierr = MatDenseRestoreArrayRead(B,&barr);CHKERRQ(ierr);
  ierr = MatDenseRestoreArray(C,&carr);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}
2213a9fe9ddaSSatish Balay 22144222ddf1SHong Zhang PetscErrorCode MatMatTransposeMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat C) 221569f65d41SStefano Zampini { 221669f65d41SStefano Zampini PetscErrorCode ierr; 221769f65d41SStefano Zampini PetscInt m=A->rmap->n,n=B->rmap->n; 22187a3c3d58SStefano Zampini PetscBool cisdense; 221969f65d41SStefano Zampini 222069f65d41SStefano Zampini PetscFunctionBegin; 22214222ddf1SHong Zhang ierr = MatSetSizes(C,m,n,m,n);CHKERRQ(ierr); 22227a3c3d58SStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 22237a3c3d58SStefano Zampini if (!cisdense) { 22247a3c3d58SStefano Zampini PetscBool flg; 22257a3c3d58SStefano Zampini 2226ca15aa20SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)B,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 22274222ddf1SHong Zhang ierr = MatSetType(C,flg ? ((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 22287a3c3d58SStefano Zampini } 222918992e5dSStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 223069f65d41SStefano Zampini PetscFunctionReturn(0); 223169f65d41SStefano Zampini } 223269f65d41SStefano Zampini 223369f65d41SStefano Zampini PetscErrorCode MatMatTransposeMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 223469f65d41SStefano Zampini { 223569f65d41SStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 223669f65d41SStefano Zampini Mat_SeqDense *b = (Mat_SeqDense*)B->data; 223769f65d41SStefano Zampini Mat_SeqDense *c = (Mat_SeqDense*)C->data; 223869f65d41SStefano Zampini PetscBLASInt m,n,k; 223969f65d41SStefano Zampini PetscScalar _DOne=1.0,_DZero=0.0; 224069f65d41SStefano Zampini PetscErrorCode ierr; 224169f65d41SStefano Zampini 224269f65d41SStefano Zampini PetscFunctionBegin; 224349d0e964SStefano Zampini ierr = PetscBLASIntCast(C->rmap->n,&m);CHKERRQ(ierr); 224449d0e964SStefano Zampini ierr = PetscBLASIntCast(C->cmap->n,&n);CHKERRQ(ierr); 224569f65d41SStefano Zampini ierr = 
PetscBLASIntCast(A->cmap->n,&k);CHKERRQ(ierr); 224649d0e964SStefano Zampini if (!m || !n || !k) PetscFunctionReturn(0); 224769f65d41SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("N","T",&m,&n,&k,&_DOne,a->v,&a->lda,b->v,&b->lda,&_DZero,c->v,&c->lda)); 2248ca15aa20SStefano Zampini ierr = PetscLogFlops(1.0*m*n*k + 1.0*m*n*(k-1));CHKERRQ(ierr); 224969f65d41SStefano Zampini PetscFunctionReturn(0); 225069f65d41SStefano Zampini } 225169f65d41SStefano Zampini 22524222ddf1SHong Zhang PetscErrorCode MatTransposeMatMultSymbolic_SeqDense_SeqDense(Mat A,Mat B,PetscReal fill,Mat C) 2253a9fe9ddaSSatish Balay { 2254ee16a9a1SHong Zhang PetscErrorCode ierr; 2255d0f46423SBarry Smith PetscInt m=A->cmap->n,n=B->cmap->n; 22567a3c3d58SStefano Zampini PetscBool cisdense; 2257a9fe9ddaSSatish Balay 2258ee16a9a1SHong Zhang PetscFunctionBegin; 22594222ddf1SHong Zhang ierr = MatSetSizes(C,m,n,m,n);CHKERRQ(ierr); 22607a3c3d58SStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 22617a3c3d58SStefano Zampini if (!cisdense) { 22627a3c3d58SStefano Zampini PetscBool flg; 22637a3c3d58SStefano Zampini 2264ca15aa20SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)B,((PetscObject)A)->type_name,&flg);CHKERRQ(ierr); 22654222ddf1SHong Zhang ierr = MatSetType(C,flg ? 
((PetscObject)A)->type_name : MATDENSE);CHKERRQ(ierr); 22667a3c3d58SStefano Zampini } 226718992e5dSStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 2268ee16a9a1SHong Zhang PetscFunctionReturn(0); 2269ee16a9a1SHong Zhang } 2270a9fe9ddaSSatish Balay 227175648e8dSHong Zhang PetscErrorCode MatTransposeMatMultNumeric_SeqDense_SeqDense(Mat A,Mat B,Mat C) 2272a9fe9ddaSSatish Balay { 2273a9fe9ddaSSatish Balay Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2274a9fe9ddaSSatish Balay Mat_SeqDense *b = (Mat_SeqDense*)B->data; 2275a9fe9ddaSSatish Balay Mat_SeqDense *c = (Mat_SeqDense*)C->data; 22760805154bSBarry Smith PetscBLASInt m,n,k; 2277a9fe9ddaSSatish Balay PetscScalar _DOne=1.0,_DZero=0.0; 2278c5df96a5SBarry Smith PetscErrorCode ierr; 2279a9fe9ddaSSatish Balay 2280a9fe9ddaSSatish Balay PetscFunctionBegin; 22818208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->rmap->n,&m);CHKERRQ(ierr); 22828208b9aeSStefano Zampini ierr = PetscBLASIntCast(C->cmap->n,&n);CHKERRQ(ierr); 2283c5df96a5SBarry Smith ierr = PetscBLASIntCast(A->rmap->n,&k);CHKERRQ(ierr); 228449d0e964SStefano Zampini if (!m || !n || !k) PetscFunctionReturn(0); 22855ca1cc5dSStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_("T","N",&m,&n,&k,&_DOne,a->v,&a->lda,b->v,&b->lda,&_DZero,c->v,&c->lda)); 2286ca15aa20SStefano Zampini ierr = PetscLogFlops(1.0*m*n*k + 1.0*m*n*(k-1));CHKERRQ(ierr); 2287a9fe9ddaSSatish Balay PetscFunctionReturn(0); 2288a9fe9ddaSSatish Balay } 2289985db425SBarry Smith 22904222ddf1SHong Zhang /* ----------------------------------------------- */ 22914222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_SeqDense_AB(Mat C) 22924222ddf1SHong Zhang { 22934222ddf1SHong Zhang PetscFunctionBegin; 22944222ddf1SHong Zhang C->ops->matmultsymbolic = MatMatMultSymbolic_SeqDense_SeqDense; 22954222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_AB; 22964222ddf1SHong Zhang /* dense mat may not call MatProductSymbolic(), thus set C->ops->productnumeric here */ 22974222ddf1SHong Zhang 
C->ops->productnumeric = MatProductNumeric_AB; 22984222ddf1SHong Zhang PetscFunctionReturn(0); 22994222ddf1SHong Zhang } 23004222ddf1SHong Zhang 23014222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_SeqDense_AtB(Mat C) 23024222ddf1SHong Zhang { 23034222ddf1SHong Zhang PetscFunctionBegin; 23044222ddf1SHong Zhang C->ops->transposematmultsymbolic = MatTransposeMatMultSymbolic_SeqDense_SeqDense; 23054222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_AtB; 23064222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_AtB; 23074222ddf1SHong Zhang PetscFunctionReturn(0); 23084222ddf1SHong Zhang } 23094222ddf1SHong Zhang 23104222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_SeqDense_ABt(Mat C) 23114222ddf1SHong Zhang { 23124222ddf1SHong Zhang PetscFunctionBegin; 23134222ddf1SHong Zhang C->ops->mattransposemultsymbolic = MatMatTransposeMultSymbolic_SeqDense_SeqDense; 23144222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_ABt; 23154222ddf1SHong Zhang C->ops->productnumeric = MatProductNumeric_ABt; 23164222ddf1SHong Zhang PetscFunctionReturn(0); 23174222ddf1SHong Zhang } 23184222ddf1SHong Zhang 23194222ddf1SHong Zhang static PetscErrorCode MatProductSetFromOptions_SeqDense_PtAP(Mat C) 23204222ddf1SHong Zhang { 23214222ddf1SHong Zhang PetscFunctionBegin; 23224222ddf1SHong Zhang C->ops->productsymbolic = MatProductSymbolic_Basic; 23234222ddf1SHong Zhang PetscFunctionReturn(0); 23244222ddf1SHong Zhang } 23254222ddf1SHong Zhang 23264222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_SeqDense(Mat C) 23274222ddf1SHong Zhang { 23284222ddf1SHong Zhang PetscErrorCode ierr; 23294222ddf1SHong Zhang Mat_Product *product = C->product; 23304222ddf1SHong Zhang 23314222ddf1SHong Zhang PetscFunctionBegin; 23324222ddf1SHong Zhang switch (product->type) { 23334222ddf1SHong Zhang case MATPRODUCT_AB: 23344222ddf1SHong Zhang ierr = MatProductSetFromOptions_SeqDense_AB(C);CHKERRQ(ierr); 23354222ddf1SHong Zhang 
break; 23364222ddf1SHong Zhang case MATPRODUCT_AtB: 23374222ddf1SHong Zhang ierr = MatProductSetFromOptions_SeqDense_AtB(C);CHKERRQ(ierr); 23384222ddf1SHong Zhang break; 23394222ddf1SHong Zhang case MATPRODUCT_ABt: 23404222ddf1SHong Zhang ierr = MatProductSetFromOptions_SeqDense_ABt(C);CHKERRQ(ierr); 23414222ddf1SHong Zhang break; 23424222ddf1SHong Zhang case MATPRODUCT_PtAP: 23435aae2c7aSStefano Zampini case MATPRODUCT_RARt: 23444222ddf1SHong Zhang ierr = MatProductSetFromOptions_SeqDense_PtAP(C);CHKERRQ(ierr); 23454222ddf1SHong Zhang break; 2346544a5e07SHong Zhang default: SETERRQ1(PetscObjectComm((PetscObject)C),PETSC_ERR_SUP,"MatProduct type %s is not supported for SeqDense and SeqDense matrices",MatProductTypes[product->type]); 23474222ddf1SHong Zhang } 23484222ddf1SHong Zhang PetscFunctionReturn(0); 23494222ddf1SHong Zhang } 23504222ddf1SHong Zhang /* ----------------------------------------------- */ 23514222ddf1SHong Zhang 2352e0877f53SBarry Smith static PetscErrorCode MatGetRowMax_SeqDense(Mat A,Vec v,PetscInt idx[]) 2353985db425SBarry Smith { 2354985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2355985db425SBarry Smith PetscErrorCode ierr; 2356d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 2357985db425SBarry Smith PetscScalar *x; 2358ca15aa20SStefano Zampini const PetscScalar *aa; 2359985db425SBarry Smith 2360985db425SBarry Smith PetscFunctionBegin; 2361e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2362985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2363985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 2364ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 2365e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2366985db425SBarry Smith for (i=0; i<m; i++) { 2367985db425SBarry Smith x[i] = aa[i]; if (idx) idx[i] = 0; 2368985db425SBarry 
Smith for (j=1; j<n; j++) { 2369ca15aa20SStefano Zampini if (PetscRealPart(x[i]) < PetscRealPart(aa[i+a->lda*j])) {x[i] = aa[i + a->lda*j]; if (idx) idx[i] = j;} 2370985db425SBarry Smith } 2371985db425SBarry Smith } 2372ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 2373985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2374985db425SBarry Smith PetscFunctionReturn(0); 2375985db425SBarry Smith } 2376985db425SBarry Smith 2377e0877f53SBarry Smith static PetscErrorCode MatGetRowMaxAbs_SeqDense(Mat A,Vec v,PetscInt idx[]) 2378985db425SBarry Smith { 2379985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2380985db425SBarry Smith PetscErrorCode ierr; 2381d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 2382985db425SBarry Smith PetscScalar *x; 2383985db425SBarry Smith PetscReal atmp; 2384ca15aa20SStefano Zampini const PetscScalar *aa; 2385985db425SBarry Smith 2386985db425SBarry Smith PetscFunctionBegin; 2387e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2388985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2389985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 2390ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 2391e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2392985db425SBarry Smith for (i=0; i<m; i++) { 23939189402eSHong Zhang x[i] = PetscAbsScalar(aa[i]); 2394985db425SBarry Smith for (j=1; j<n; j++) { 2395ca15aa20SStefano Zampini atmp = PetscAbsScalar(aa[i+a->lda*j]); 2396985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = j;} 2397985db425SBarry Smith } 2398985db425SBarry Smith } 2399ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 2400985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2401985db425SBarry Smith 
PetscFunctionReturn(0); 2402985db425SBarry Smith } 2403985db425SBarry Smith 2404e0877f53SBarry Smith static PetscErrorCode MatGetRowMin_SeqDense(Mat A,Vec v,PetscInt idx[]) 2405985db425SBarry Smith { 2406985db425SBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2407985db425SBarry Smith PetscErrorCode ierr; 2408d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,p; 2409985db425SBarry Smith PetscScalar *x; 2410ca15aa20SStefano Zampini const PetscScalar *aa; 2411985db425SBarry Smith 2412985db425SBarry Smith PetscFunctionBegin; 2413e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2414ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 2415985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2416985db425SBarry Smith ierr = VecGetLocalSize(v,&p);CHKERRQ(ierr); 2417e32f2f54SBarry Smith if (p != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 2418985db425SBarry Smith for (i=0; i<m; i++) { 2419985db425SBarry Smith x[i] = aa[i]; if (idx) idx[i] = 0; 2420985db425SBarry Smith for (j=1; j<n; j++) { 2421ca15aa20SStefano Zampini if (PetscRealPart(x[i]) > PetscRealPart(aa[i+a->lda*j])) {x[i] = aa[i + a->lda*j]; if (idx) idx[i] = j;} 2422985db425SBarry Smith } 2423985db425SBarry Smith } 2424985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2425ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 2426985db425SBarry Smith PetscFunctionReturn(0); 2427985db425SBarry Smith } 2428985db425SBarry Smith 2429637a0070SStefano Zampini PetscErrorCode MatGetColumnVector_SeqDense(Mat A,Vec v,PetscInt col) 24308d0534beSBarry Smith { 24318d0534beSBarry Smith Mat_SeqDense *a = (Mat_SeqDense*)A->data; 24328d0534beSBarry Smith PetscErrorCode ierr; 24338d0534beSBarry Smith PetscScalar *x; 2434ca15aa20SStefano Zampini const PetscScalar *aa; 24358d0534beSBarry Smith 24368d0534beSBarry Smith 
PetscFunctionBegin; 2437e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2438ca15aa20SStefano Zampini ierr = MatDenseGetArrayRead(A,&aa);CHKERRQ(ierr); 24398d0534beSBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 2440ca15aa20SStefano Zampini ierr = PetscArraycpy(x,aa+col*a->lda,A->rmap->n);CHKERRQ(ierr); 24418d0534beSBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 2442ca15aa20SStefano Zampini ierr = MatDenseRestoreArrayRead(A,&aa);CHKERRQ(ierr); 24438d0534beSBarry Smith PetscFunctionReturn(0); 24448d0534beSBarry Smith } 24458d0534beSBarry Smith 244652c5f739Sprj- PETSC_INTERN PetscErrorCode MatGetColumnNorms_SeqDense(Mat A,NormType type,PetscReal *norms) 24470716a85fSBarry Smith { 24480716a85fSBarry Smith PetscErrorCode ierr; 24490716a85fSBarry Smith PetscInt i,j,m,n; 24501683a169SBarry Smith const PetscScalar *a; 24510716a85fSBarry Smith 24520716a85fSBarry Smith PetscFunctionBegin; 24530716a85fSBarry Smith ierr = MatGetSize(A,&m,&n);CHKERRQ(ierr); 2454580bdb30SBarry Smith ierr = PetscArrayzero(norms,n);CHKERRQ(ierr); 24551683a169SBarry Smith ierr = MatDenseGetArrayRead(A,&a);CHKERRQ(ierr); 24560716a85fSBarry Smith if (type == NORM_2) { 24570716a85fSBarry Smith for (i=0; i<n; i++) { 24580716a85fSBarry Smith for (j=0; j<m; j++) { 24590716a85fSBarry Smith norms[i] += PetscAbsScalar(a[j]*a[j]); 24600716a85fSBarry Smith } 24610716a85fSBarry Smith a += m; 24620716a85fSBarry Smith } 24630716a85fSBarry Smith } else if (type == NORM_1) { 24640716a85fSBarry Smith for (i=0; i<n; i++) { 24650716a85fSBarry Smith for (j=0; j<m; j++) { 24660716a85fSBarry Smith norms[i] += PetscAbsScalar(a[j]); 24670716a85fSBarry Smith } 24680716a85fSBarry Smith a += m; 24690716a85fSBarry Smith } 24700716a85fSBarry Smith } else if (type == NORM_INFINITY) { 24710716a85fSBarry Smith for (i=0; i<n; i++) { 24720716a85fSBarry Smith for (j=0; j<m; j++) { 24730716a85fSBarry Smith norms[i] = 
PetscMax(PetscAbsScalar(a[j]),norms[i]); 24740716a85fSBarry Smith } 24750716a85fSBarry Smith a += m; 24760716a85fSBarry Smith } 2477ce94432eSBarry Smith } else SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Unknown NormType"); 24781683a169SBarry Smith ierr = MatDenseRestoreArrayRead(A,&a);CHKERRQ(ierr); 24790716a85fSBarry Smith if (type == NORM_2) { 24808f1a2a5eSBarry Smith for (i=0; i<n; i++) norms[i] = PetscSqrtReal(norms[i]); 24810716a85fSBarry Smith } 24820716a85fSBarry Smith PetscFunctionReturn(0); 24830716a85fSBarry Smith } 24840716a85fSBarry Smith 248573a71a0fSBarry Smith static PetscErrorCode MatSetRandom_SeqDense(Mat x,PetscRandom rctx) 248673a71a0fSBarry Smith { 248773a71a0fSBarry Smith PetscErrorCode ierr; 248873a71a0fSBarry Smith PetscScalar *a; 2489637a0070SStefano Zampini PetscInt lda,m,n,i,j; 249073a71a0fSBarry Smith 249173a71a0fSBarry Smith PetscFunctionBegin; 249273a71a0fSBarry Smith ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr); 2493637a0070SStefano Zampini ierr = MatDenseGetLDA(x,&lda);CHKERRQ(ierr); 24948c778c55SBarry Smith ierr = MatDenseGetArray(x,&a);CHKERRQ(ierr); 2495637a0070SStefano Zampini for (j=0; j<n; j++) { 2496637a0070SStefano Zampini for (i=0; i<m; i++) { 2497637a0070SStefano Zampini ierr = PetscRandomGetValue(rctx,a+j*lda+i);CHKERRQ(ierr); 2498637a0070SStefano Zampini } 249973a71a0fSBarry Smith } 25008c778c55SBarry Smith ierr = MatDenseRestoreArray(x,&a);CHKERRQ(ierr); 250173a71a0fSBarry Smith PetscFunctionReturn(0); 250273a71a0fSBarry Smith } 250373a71a0fSBarry Smith 25043b49f96aSBarry Smith static PetscErrorCode MatMissingDiagonal_SeqDense(Mat A,PetscBool *missing,PetscInt *d) 25053b49f96aSBarry Smith { 25063b49f96aSBarry Smith PetscFunctionBegin; 25073b49f96aSBarry Smith *missing = PETSC_FALSE; 25083b49f96aSBarry Smith PetscFunctionReturn(0); 25093b49f96aSBarry Smith } 251073a71a0fSBarry Smith 2511ca15aa20SStefano Zampini /* vals is not const */ 2512af53bab2SHong Zhang static PetscErrorCode 
MatDenseGetColumn_SeqDense(Mat A,PetscInt col,PetscScalar **vals) 251386aefd0dSHong Zhang { 2514ca15aa20SStefano Zampini PetscErrorCode ierr; 251586aefd0dSHong Zhang Mat_SeqDense *a = (Mat_SeqDense*)A->data; 2516ca15aa20SStefano Zampini PetscScalar *v; 251786aefd0dSHong Zhang 251886aefd0dSHong Zhang PetscFunctionBegin; 251986aefd0dSHong Zhang if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 2520ca15aa20SStefano Zampini ierr = MatDenseGetArray(A,&v);CHKERRQ(ierr); 2521ca15aa20SStefano Zampini *vals = v+col*a->lda; 2522ca15aa20SStefano Zampini ierr = MatDenseRestoreArray(A,&v);CHKERRQ(ierr); 252386aefd0dSHong Zhang PetscFunctionReturn(0); 252486aefd0dSHong Zhang } 252586aefd0dSHong Zhang 2526af53bab2SHong Zhang static PetscErrorCode MatDenseRestoreColumn_SeqDense(Mat A,PetscScalar **vals) 252786aefd0dSHong Zhang { 252886aefd0dSHong Zhang PetscFunctionBegin; 252986aefd0dSHong Zhang *vals = 0; /* user cannot accidently use the array later */ 253086aefd0dSHong Zhang PetscFunctionReturn(0); 253186aefd0dSHong Zhang } 2532abc3b08eSStefano Zampini 2533289bc588SBarry Smith /* -------------------------------------------------------------------*/ 2534a5ae1ecdSBarry Smith static struct _MatOps MatOps_Values = { MatSetValues_SeqDense, 2535905e6a2fSBarry Smith MatGetRow_SeqDense, 2536905e6a2fSBarry Smith MatRestoreRow_SeqDense, 2537905e6a2fSBarry Smith MatMult_SeqDense, 253897304618SKris Buschelman /* 4*/ MatMultAdd_SeqDense, 25397c922b88SBarry Smith MatMultTranspose_SeqDense, 25407c922b88SBarry Smith MatMultTransposeAdd_SeqDense, 2541db4efbfdSBarry Smith 0, 2542db4efbfdSBarry Smith 0, 2543db4efbfdSBarry Smith 0, 2544db4efbfdSBarry Smith /* 10*/ 0, 2545905e6a2fSBarry Smith MatLUFactor_SeqDense, 2546905e6a2fSBarry Smith MatCholeskyFactor_SeqDense, 254741f059aeSBarry Smith MatSOR_SeqDense, 2548ec8511deSBarry Smith MatTranspose_SeqDense, 254997304618SKris Buschelman /* 15*/ MatGetInfo_SeqDense, 2550905e6a2fSBarry Smith 
MatEqual_SeqDense, 2551905e6a2fSBarry Smith MatGetDiagonal_SeqDense, 2552905e6a2fSBarry Smith MatDiagonalScale_SeqDense, 2553905e6a2fSBarry Smith MatNorm_SeqDense, 2554c0aa2d19SHong Zhang /* 20*/ MatAssemblyBegin_SeqDense, 2555c0aa2d19SHong Zhang MatAssemblyEnd_SeqDense, 2556905e6a2fSBarry Smith MatSetOption_SeqDense, 2557905e6a2fSBarry Smith MatZeroEntries_SeqDense, 2558d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqDense, 2559db4efbfdSBarry Smith 0, 2560db4efbfdSBarry Smith 0, 2561db4efbfdSBarry Smith 0, 2562db4efbfdSBarry Smith 0, 25634994cf47SJed Brown /* 29*/ MatSetUp_SeqDense, 2564273d9f13SBarry Smith 0, 2565905e6a2fSBarry Smith 0, 256673a71a0fSBarry Smith 0, 256773a71a0fSBarry Smith 0, 2568d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqDense, 2569a5ae1ecdSBarry Smith 0, 2570a5ae1ecdSBarry Smith 0, 2571a5ae1ecdSBarry Smith 0, 2572a5ae1ecdSBarry Smith 0, 2573d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqDense, 25747dae84e0SHong Zhang MatCreateSubMatrices_SeqDense, 2575a5ae1ecdSBarry Smith 0, 25764b0e389bSBarry Smith MatGetValues_SeqDense, 2577a5ae1ecdSBarry Smith MatCopy_SeqDense, 2578d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqDense, 2579a5ae1ecdSBarry Smith MatScale_SeqDense, 25807d68702bSBarry Smith MatShift_Basic, 2581a5ae1ecdSBarry Smith 0, 25823f49a652SStefano Zampini MatZeroRowsColumns_SeqDense, 258373a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqDense, 2584a5ae1ecdSBarry Smith 0, 2585a5ae1ecdSBarry Smith 0, 2586a5ae1ecdSBarry Smith 0, 2587a5ae1ecdSBarry Smith 0, 2588d519adbfSMatthew Knepley /* 54*/ 0, 2589a5ae1ecdSBarry Smith 0, 2590a5ae1ecdSBarry Smith 0, 2591a5ae1ecdSBarry Smith 0, 2592a5ae1ecdSBarry Smith 0, 2593d519adbfSMatthew Knepley /* 59*/ 0, 2594e03a110bSBarry Smith MatDestroy_SeqDense, 2595e03a110bSBarry Smith MatView_SeqDense, 2596357abbc8SBarry Smith 0, 259797304618SKris Buschelman 0, 2598d519adbfSMatthew Knepley /* 64*/ 0, 259997304618SKris Buschelman 0, 260097304618SKris Buschelman 0, 260197304618SKris Buschelman 0, 260297304618SKris 
Buschelman 0, 2603d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqDense, 260497304618SKris Buschelman 0, 260597304618SKris Buschelman 0, 260697304618SKris Buschelman 0, 260797304618SKris Buschelman 0, 2608d519adbfSMatthew Knepley /* 74*/ 0, 260997304618SKris Buschelman 0, 261097304618SKris Buschelman 0, 261197304618SKris Buschelman 0, 261297304618SKris Buschelman 0, 2613d519adbfSMatthew Knepley /* 79*/ 0, 261497304618SKris Buschelman 0, 261597304618SKris Buschelman 0, 261697304618SKris Buschelman 0, 26175bba2384SShri Abhyankar /* 83*/ MatLoad_SeqDense, 2618637a0070SStefano Zampini MatIsSymmetric_SeqDense, 26191cbb95d3SBarry Smith MatIsHermitian_SeqDense, 2620865e5f61SKris Buschelman 0, 2621865e5f61SKris Buschelman 0, 2622865e5f61SKris Buschelman 0, 26234222ddf1SHong Zhang /* 89*/ 0, 26244222ddf1SHong Zhang 0, 2625a9fe9ddaSSatish Balay MatMatMultNumeric_SeqDense_SeqDense, 26264222ddf1SHong Zhang 0, 26274222ddf1SHong Zhang 0, 26284222ddf1SHong Zhang /* 94*/ 0, 26294222ddf1SHong Zhang 0, 26304222ddf1SHong Zhang 0, 263169f65d41SStefano Zampini MatMatTransposeMultNumeric_SeqDense_SeqDense, 2632284134d9SBarry Smith 0, 26334222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqDense, 2634284134d9SBarry Smith 0, 2635284134d9SBarry Smith 0, 2636ba337c44SJed Brown MatConjugate_SeqDense, 2637f73d5cc4SBarry Smith 0, 2638ba337c44SJed Brown /*104*/ 0, 2639ba337c44SJed Brown MatRealPart_SeqDense, 2640ba337c44SJed Brown MatImaginaryPart_SeqDense, 2641985db425SBarry Smith 0, 2642985db425SBarry Smith 0, 26438208b9aeSStefano Zampini /*109*/ 0, 2644985db425SBarry Smith 0, 26458d0534beSBarry Smith MatGetRowMin_SeqDense, 2646aabbc4fbSShri Abhyankar MatGetColumnVector_SeqDense, 26473b49f96aSBarry Smith MatMissingDiagonal_SeqDense, 2648aabbc4fbSShri Abhyankar /*114*/ 0, 2649aabbc4fbSShri Abhyankar 0, 2650aabbc4fbSShri Abhyankar 0, 2651aabbc4fbSShri Abhyankar 0, 2652aabbc4fbSShri Abhyankar 0, 2653aabbc4fbSShri Abhyankar /*119*/ 0, 2654aabbc4fbSShri Abhyankar 0, 2655aabbc4fbSShri 
Abhyankar 0, 26560716a85fSBarry Smith 0, 26570716a85fSBarry Smith 0, 26580716a85fSBarry Smith /*124*/ 0, 26595df89d91SHong Zhang MatGetColumnNorms_SeqDense, 26605df89d91SHong Zhang 0, 26615df89d91SHong Zhang 0, 26625df89d91SHong Zhang 0, 26635df89d91SHong Zhang /*129*/ 0, 26644222ddf1SHong Zhang 0, 26654222ddf1SHong Zhang 0, 266675648e8dSHong Zhang MatTransposeMatMultNumeric_SeqDense_SeqDense, 26673964eb88SJed Brown 0, 26683964eb88SJed Brown /*134*/ 0, 26693964eb88SJed Brown 0, 26703964eb88SJed Brown 0, 26713964eb88SJed Brown 0, 26723964eb88SJed Brown 0, 26733964eb88SJed Brown /*139*/ 0, 2674f9426fe0SMark Adams 0, 2675d528f656SJakub Kruzik 0, 2676d528f656SJakub Kruzik 0, 2677d528f656SJakub Kruzik 0, 26784222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqDense, 26794222ddf1SHong Zhang /*145*/ 0, 26804222ddf1SHong Zhang 0, 26814222ddf1SHong Zhang 0 2682985db425SBarry Smith }; 268390ace30eSBarry Smith 26844b828684SBarry Smith /*@C 2685fafbff53SBarry Smith MatCreateSeqDense - Creates a sequential dense matrix that 2686d65003e9SLois Curfman McInnes is stored in column major order (the usual Fortran 77 manner). Many 2687d65003e9SLois Curfman McInnes of the matrix operations use the BLAS and LAPACK routines. 2688289bc588SBarry Smith 2689d083f849SBarry Smith Collective 2690db81eaa0SLois Curfman McInnes 269120563c6bSBarry Smith Input Parameters: 2692db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 26930c775827SLois Curfman McInnes . m - number of rows 269418f449edSLois Curfman McInnes . n - number of columns 26950298fd71SBarry Smith - data - optional location of matrix data in column major order. Set data=NULL for PETSc 2696dfc5480cSLois Curfman McInnes to control all matrix memory allocation. 269720563c6bSBarry Smith 269820563c6bSBarry Smith Output Parameter: 269944cd7ae7SLois Curfman McInnes . 
A - the matrix 270020563c6bSBarry Smith 2701b259b22eSLois Curfman McInnes Notes: 270218f449edSLois Curfman McInnes The data input variable is intended primarily for Fortran programmers 270318f449edSLois Curfman McInnes who wish to allocate their own matrix memory space. Most users should 27040298fd71SBarry Smith set data=NULL. 270518f449edSLois Curfman McInnes 2706027ccd11SLois Curfman McInnes Level: intermediate 2707027ccd11SLois Curfman McInnes 270869b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateDense(), MatSetValues() 270920563c6bSBarry Smith @*/ 27107087cfbeSBarry Smith PetscErrorCode MatCreateSeqDense(MPI_Comm comm,PetscInt m,PetscInt n,PetscScalar *data,Mat *A) 2711289bc588SBarry Smith { 2712dfbe8321SBarry Smith PetscErrorCode ierr; 27133b2fbd54SBarry Smith 27143a40ed3dSBarry Smith PetscFunctionBegin; 2715f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 2716f69a0ea3SMatthew Knepley ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 2717273d9f13SBarry Smith ierr = MatSetType(*A,MATSEQDENSE);CHKERRQ(ierr); 2718273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(*A,data);CHKERRQ(ierr); 2719273d9f13SBarry Smith PetscFunctionReturn(0); 2720273d9f13SBarry Smith } 2721273d9f13SBarry Smith 2722273d9f13SBarry Smith /*@C 2723273d9f13SBarry Smith MatSeqDenseSetPreallocation - Sets the array used for storing the matrix elements 2724273d9f13SBarry Smith 2725d083f849SBarry Smith Collective 2726273d9f13SBarry Smith 2727273d9f13SBarry Smith Input Parameters: 27281c4f3114SJed Brown + B - the matrix 27290298fd71SBarry Smith - data - the array (or NULL) 2730273d9f13SBarry Smith 2731273d9f13SBarry Smith Notes: 2732273d9f13SBarry Smith The data input variable is intended primarily for Fortran programmers 2733273d9f13SBarry Smith who wish to allocate their own matrix memory space. Most users should 2734284134d9SBarry Smith need not call this routine. 
2735273d9f13SBarry Smith 2736273d9f13SBarry Smith Level: intermediate 2737273d9f13SBarry Smith 273869b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateDense(), MatSetValues(), MatSeqDenseSetLDA() 2739867c911aSBarry Smith 2740273d9f13SBarry Smith @*/ 27417087cfbeSBarry Smith PetscErrorCode MatSeqDenseSetPreallocation(Mat B,PetscScalar data[]) 2742273d9f13SBarry Smith { 27434ac538c5SBarry Smith PetscErrorCode ierr; 2744a23d5eceSKris Buschelman 2745a23d5eceSKris Buschelman PetscFunctionBegin; 2746d5ea218eSStefano Zampini PetscValidHeaderSpecific(B,MAT_CLASSID,1); 27474ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqDenseSetPreallocation_C",(Mat,PetscScalar[]),(B,data));CHKERRQ(ierr); 2748a23d5eceSKris Buschelman PetscFunctionReturn(0); 2749a23d5eceSKris Buschelman } 2750a23d5eceSKris Buschelman 27517087cfbeSBarry Smith PetscErrorCode MatSeqDenseSetPreallocation_SeqDense(Mat B,PetscScalar *data) 2752a23d5eceSKris Buschelman { 2753273d9f13SBarry Smith Mat_SeqDense *b; 2754dfbe8321SBarry Smith PetscErrorCode ierr; 2755273d9f13SBarry Smith 2756273d9f13SBarry Smith PetscFunctionBegin; 2757273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 2758a868139aSShri Abhyankar 275934ef9618SShri Abhyankar ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 276034ef9618SShri Abhyankar ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 276134ef9618SShri Abhyankar 2762273d9f13SBarry Smith b = (Mat_SeqDense*)B->data; 276386d161a7SShri Abhyankar b->Mmax = B->rmap->n; 276486d161a7SShri Abhyankar b->Nmax = B->cmap->n; 276586d161a7SShri Abhyankar if (b->lda <= 0 || b->changelda) b->lda = B->rmap->n; 276686d161a7SShri Abhyankar 2767220afb94SBarry Smith ierr = PetscIntMultError(b->lda,b->Nmax,NULL);CHKERRQ(ierr); 27689e8f95c4SLisandro Dalcin if (!data) { /* petsc-allocated storage */ 27699e8f95c4SLisandro Dalcin if (!b->user_alloc) { ierr = PetscFree(b->v);CHKERRQ(ierr); } 2770e92229d0SSatish Balay ierr = PetscCalloc1((size_t)b->lda*b->Nmax,&b->v);CHKERRQ(ierr); 27713bb1ff40SBarry Smith ierr = 
PetscLogObjectMemory((PetscObject)B,b->lda*b->Nmax*sizeof(PetscScalar));CHKERRQ(ierr); 27722205254eSKarl Rupp 27739e8f95c4SLisandro Dalcin b->user_alloc = PETSC_FALSE; 2774273d9f13SBarry Smith } else { /* user-allocated storage */ 27759e8f95c4SLisandro Dalcin if (!b->user_alloc) { ierr = PetscFree(b->v);CHKERRQ(ierr); } 2776273d9f13SBarry Smith b->v = data; 2777273d9f13SBarry Smith b->user_alloc = PETSC_TRUE; 2778273d9f13SBarry Smith } 27790450473dSBarry Smith B->assembled = PETSC_TRUE; 2780273d9f13SBarry Smith PetscFunctionReturn(0); 2781273d9f13SBarry Smith } 2782273d9f13SBarry Smith 278365b80a83SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 2784cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqDense_Elemental(Mat A, MatType newtype,MatReuse reuse,Mat *newmat) 27858baccfbdSHong Zhang { 2786d77f618aSHong Zhang Mat mat_elemental; 2787d77f618aSHong Zhang PetscErrorCode ierr; 27881683a169SBarry Smith const PetscScalar *array; 27891683a169SBarry Smith PetscScalar *v_colwise; 2790d77f618aSHong Zhang PetscInt M=A->rmap->N,N=A->cmap->N,i,j,k,*rows,*cols; 2791d77f618aSHong Zhang 27928baccfbdSHong Zhang PetscFunctionBegin; 2793d77f618aSHong Zhang ierr = PetscMalloc3(M*N,&v_colwise,M,&rows,N,&cols);CHKERRQ(ierr); 27941683a169SBarry Smith ierr = MatDenseGetArrayRead(A,&array);CHKERRQ(ierr); 2795d77f618aSHong Zhang /* convert column-wise array into row-wise v_colwise, see MatSetValues_Elemental() */ 2796d77f618aSHong Zhang k = 0; 2797d77f618aSHong Zhang for (j=0; j<N; j++) { 2798d77f618aSHong Zhang cols[j] = j; 2799d77f618aSHong Zhang for (i=0; i<M; i++) { 2800d77f618aSHong Zhang v_colwise[j*M+i] = array[k++]; 2801d77f618aSHong Zhang } 2802d77f618aSHong Zhang } 2803d77f618aSHong Zhang for (i=0; i<M; i++) { 2804d77f618aSHong Zhang rows[i] = i; 2805d77f618aSHong Zhang } 28061683a169SBarry Smith ierr = MatDenseRestoreArrayRead(A,&array);CHKERRQ(ierr); 2807d77f618aSHong Zhang 2808d77f618aSHong Zhang ierr = MatCreate(PetscObjectComm((PetscObject)A), 
&mat_elemental);CHKERRQ(ierr); 2809d77f618aSHong Zhang ierr = MatSetSizes(mat_elemental,PETSC_DECIDE,PETSC_DECIDE,M,N);CHKERRQ(ierr); 2810d77f618aSHong Zhang ierr = MatSetType(mat_elemental,MATELEMENTAL);CHKERRQ(ierr); 2811d77f618aSHong Zhang ierr = MatSetUp(mat_elemental);CHKERRQ(ierr); 2812d77f618aSHong Zhang 2813d77f618aSHong Zhang /* PETSc-Elemental interaface uses axpy for setting off-processor entries, only ADD_VALUES is allowed */ 2814d77f618aSHong Zhang ierr = MatSetValues(mat_elemental,M,rows,N,cols,v_colwise,ADD_VALUES);CHKERRQ(ierr); 2815d77f618aSHong Zhang ierr = MatAssemblyBegin(mat_elemental, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2816d77f618aSHong Zhang ierr = MatAssemblyEnd(mat_elemental, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2817d77f618aSHong Zhang ierr = PetscFree3(v_colwise,rows,cols);CHKERRQ(ierr); 2818d77f618aSHong Zhang 2819511c6705SHong Zhang if (reuse == MAT_INPLACE_MATRIX) { 282028be2f97SBarry Smith ierr = MatHeaderReplace(A,&mat_elemental);CHKERRQ(ierr); 2821d77f618aSHong Zhang } else { 2822d77f618aSHong Zhang *newmat = mat_elemental; 2823d77f618aSHong Zhang } 28248baccfbdSHong Zhang PetscFunctionReturn(0); 28258baccfbdSHong Zhang } 282665b80a83SHong Zhang #endif 28278baccfbdSHong Zhang 28281b807ce4Svictorle /*@C 28291b807ce4Svictorle MatSeqDenseSetLDA - Declare the leading dimension of the user-provided array 28301b807ce4Svictorle 28311b807ce4Svictorle Input parameter: 28321b807ce4Svictorle + A - the matrix 28331b807ce4Svictorle - lda - the leading dimension 28341b807ce4Svictorle 28351b807ce4Svictorle Notes: 2836867c911aSBarry Smith This routine is to be used in conjunction with MatSeqDenseSetPreallocation(); 28371b807ce4Svictorle it asserts that the preallocation has a leading dimension (the LDA parameter 28381b807ce4Svictorle of Blas and Lapack fame) larger than M, the first dimension of the matrix. 
28391b807ce4Svictorle 28401b807ce4Svictorle Level: intermediate 28411b807ce4Svictorle 2842284134d9SBarry Smith .seealso: MatCreate(), MatCreateSeqDense(), MatSeqDenseSetPreallocation(), MatSetMaximumSize() 2843867c911aSBarry Smith 28441b807ce4Svictorle @*/ 28457087cfbeSBarry Smith PetscErrorCode MatSeqDenseSetLDA(Mat B,PetscInt lda) 28461b807ce4Svictorle { 28471b807ce4Svictorle Mat_SeqDense *b = (Mat_SeqDense*)B->data; 2848d5ea218eSStefano Zampini PetscBool flg; 2849d5ea218eSStefano Zampini PetscErrorCode ierr; 285021a2c019SBarry Smith 28511b807ce4Svictorle PetscFunctionBegin; 2852d5ea218eSStefano Zampini PetscValidHeaderSpecific(B,MAT_CLASSID,1); 2853d5ea218eSStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 2854d5ea218eSStefano Zampini if (!flg) PetscFunctionReturn(0); 2855e32f2f54SBarry Smith if (lda < B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"LDA %D must be at least matrix dimension %D",lda,B->rmap->n); 28561b807ce4Svictorle b->lda = lda; 285721a2c019SBarry Smith b->changelda = PETSC_FALSE; 285821a2c019SBarry Smith b->Mmax = PetscMax(b->Mmax,lda); 28591b807ce4Svictorle PetscFunctionReturn(0); 28601b807ce4Svictorle } 28611b807ce4Svictorle 2862d528f656SJakub Kruzik PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqDense(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 2863d528f656SJakub Kruzik { 2864d528f656SJakub Kruzik PetscErrorCode ierr; 2865d528f656SJakub Kruzik PetscMPIInt size; 2866d528f656SJakub Kruzik 2867d528f656SJakub Kruzik PetscFunctionBegin; 2868d528f656SJakub Kruzik ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 2869d528f656SJakub Kruzik if (size == 1) { 2870d528f656SJakub Kruzik if (scall == MAT_INITIAL_MATRIX) { 2871d528f656SJakub Kruzik ierr = MatDuplicate(inmat,MAT_COPY_VALUES,outmat);CHKERRQ(ierr); 2872d528f656SJakub Kruzik } else { 2873d528f656SJakub Kruzik ierr = MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 2874d528f656SJakub Kruzik 
} 2875d528f656SJakub Kruzik } else { 2876d528f656SJakub Kruzik ierr = MatCreateMPIMatConcatenateSeqMat_MPIDense(comm,inmat,n,scall,outmat);CHKERRQ(ierr); 2877d528f656SJakub Kruzik } 2878d528f656SJakub Kruzik PetscFunctionReturn(0); 2879d528f656SJakub Kruzik } 2880d528f656SJakub Kruzik 28816947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVec_SeqDense(Mat A,PetscInt col,Vec *v) 28826947451fSStefano Zampini { 28836947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 28846947451fSStefano Zampini PetscErrorCode ierr; 28856947451fSStefano Zampini 28866947451fSStefano Zampini PetscFunctionBegin; 28876947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 28886947451fSStefano Zampini if (!a->cvec) { 28896947451fSStefano Zampini ierr = VecCreateSeqWithArray(PetscObjectComm((PetscObject)A),A->rmap->bs,A->rmap->n,NULL,&a->cvec);CHKERRQ(ierr); 28906947451fSStefano Zampini } 28916947451fSStefano Zampini a->vecinuse = col + 1; 28926947451fSStefano Zampini ierr = MatDenseGetArray(A,(PetscScalar**)&a->ptrinuse);CHKERRQ(ierr); 28936947451fSStefano Zampini ierr = VecPlaceArray(a->cvec,a->ptrinuse + (size_t)col * (size_t)a->lda);CHKERRQ(ierr); 28946947451fSStefano Zampini *v = a->cvec; 28956947451fSStefano Zampini PetscFunctionReturn(0); 28966947451fSStefano Zampini } 28976947451fSStefano Zampini 28986947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVec_SeqDense(Mat A,PetscInt col,Vec *v) 28996947451fSStefano Zampini { 29006947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 29016947451fSStefano Zampini PetscErrorCode ierr; 29026947451fSStefano Zampini 29036947451fSStefano Zampini PetscFunctionBegin; 29046947451fSStefano Zampini if (!a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseGetColumnVec first"); 29056947451fSStefano Zampini if (!a->cvec) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Missing internal column vector"); 29066947451fSStefano 
Zampini a->vecinuse = 0; 29076947451fSStefano Zampini ierr = MatDenseRestoreArray(A,(PetscScalar**)&a->ptrinuse);CHKERRQ(ierr); 29086947451fSStefano Zampini ierr = VecResetArray(a->cvec);CHKERRQ(ierr); 29096947451fSStefano Zampini *v = NULL; 29106947451fSStefano Zampini PetscFunctionReturn(0); 29116947451fSStefano Zampini } 29126947451fSStefano Zampini 29136947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVecRead_SeqDense(Mat A,PetscInt col,Vec *v) 29146947451fSStefano Zampini { 29156947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 29166947451fSStefano Zampini PetscErrorCode ierr; 29176947451fSStefano Zampini 29186947451fSStefano Zampini PetscFunctionBegin; 29196947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 29206947451fSStefano Zampini if (!a->cvec) { 29216947451fSStefano Zampini ierr = VecCreateSeqWithArray(PetscObjectComm((PetscObject)A),A->rmap->bs,A->rmap->n,NULL,&a->cvec);CHKERRQ(ierr); 29226947451fSStefano Zampini } 29236947451fSStefano Zampini a->vecinuse = col + 1; 29246947451fSStefano Zampini ierr = MatDenseGetArrayRead(A,&a->ptrinuse);CHKERRQ(ierr); 29256947451fSStefano Zampini ierr = VecPlaceArray(a->cvec,a->ptrinuse + (size_t)col * (size_t)a->lda);CHKERRQ(ierr); 29266947451fSStefano Zampini ierr = VecLockReadPush(a->cvec);CHKERRQ(ierr); 29276947451fSStefano Zampini *v = a->cvec; 29286947451fSStefano Zampini PetscFunctionReturn(0); 29296947451fSStefano Zampini } 29306947451fSStefano Zampini 29316947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVecRead_SeqDense(Mat A,PetscInt col,Vec *v) 29326947451fSStefano Zampini { 29336947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 29346947451fSStefano Zampini PetscErrorCode ierr; 29356947451fSStefano Zampini 29366947451fSStefano Zampini PetscFunctionBegin; 29376947451fSStefano Zampini if (!a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseGetColumnVec 
first"); 29386947451fSStefano Zampini if (!a->cvec) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Missing internal column vector"); 29396947451fSStefano Zampini a->vecinuse = 0; 29406947451fSStefano Zampini ierr = MatDenseRestoreArrayRead(A,&a->ptrinuse);CHKERRQ(ierr); 29416947451fSStefano Zampini ierr = VecLockReadPop(a->cvec);CHKERRQ(ierr); 29426947451fSStefano Zampini ierr = VecResetArray(a->cvec);CHKERRQ(ierr); 29436947451fSStefano Zampini *v = NULL; 29446947451fSStefano Zampini PetscFunctionReturn(0); 29456947451fSStefano Zampini } 29466947451fSStefano Zampini 29476947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVecWrite_SeqDense(Mat A,PetscInt col,Vec *v) 29486947451fSStefano Zampini { 29496947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 29506947451fSStefano Zampini PetscErrorCode ierr; 29516947451fSStefano Zampini 29526947451fSStefano Zampini PetscFunctionBegin; 29536947451fSStefano Zampini if (a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseRestoreColumnVec first"); 29546947451fSStefano Zampini if (!a->cvec) { 29556947451fSStefano Zampini ierr = VecCreateSeqWithArray(PetscObjectComm((PetscObject)A),A->rmap->bs,A->rmap->n,NULL,&a->cvec);CHKERRQ(ierr); 29566947451fSStefano Zampini } 29576947451fSStefano Zampini a->vecinuse = col + 1; 29586947451fSStefano Zampini ierr = MatDenseGetArrayWrite(A,(PetscScalar**)&a->ptrinuse);CHKERRQ(ierr); 29596947451fSStefano Zampini ierr = VecPlaceArray(a->cvec,a->ptrinuse + (size_t)col * (size_t)a->lda);CHKERRQ(ierr); 29606947451fSStefano Zampini *v = a->cvec; 29616947451fSStefano Zampini PetscFunctionReturn(0); 29626947451fSStefano Zampini } 29636947451fSStefano Zampini 29646947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVecWrite_SeqDense(Mat A,PetscInt col,Vec *v) 29656947451fSStefano Zampini { 29666947451fSStefano Zampini Mat_SeqDense *a = (Mat_SeqDense*)A->data; 29676947451fSStefano Zampini PetscErrorCode ierr; 29686947451fSStefano Zampini 29696947451fSStefano 
Zampini PetscFunctionBegin; 29706947451fSStefano Zampini if (!a->vecinuse) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Need to call MatDenseGetColumnVec first"); 29716947451fSStefano Zampini if (!a->cvec) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Missing internal column vector"); 29726947451fSStefano Zampini a->vecinuse = 0; 29736947451fSStefano Zampini ierr = MatDenseRestoreArrayWrite(A,(PetscScalar**)&a->ptrinuse);CHKERRQ(ierr); 29746947451fSStefano Zampini ierr = VecResetArray(a->cvec);CHKERRQ(ierr); 29756947451fSStefano Zampini *v = NULL; 29766947451fSStefano Zampini PetscFunctionReturn(0); 29776947451fSStefano Zampini } 29786947451fSStefano Zampini 29790bad9183SKris Buschelman /*MC 2980fafad747SKris Buschelman MATSEQDENSE - MATSEQDENSE = "seqdense" - A matrix type to be used for sequential dense matrices. 29810bad9183SKris Buschelman 29820bad9183SKris Buschelman Options Database Keys: 29830bad9183SKris Buschelman . -mat_type seqdense - sets the matrix type to "seqdense" during a call to MatSetFromOptions() 29840bad9183SKris Buschelman 29850bad9183SKris Buschelman Level: beginner 29860bad9183SKris Buschelman 298789665df3SBarry Smith .seealso: MatCreateSeqDense() 298889665df3SBarry Smith 29890bad9183SKris Buschelman M*/ 2990ca15aa20SStefano Zampini PetscErrorCode MatCreate_SeqDense(Mat B) 2991273d9f13SBarry Smith { 2992273d9f13SBarry Smith Mat_SeqDense *b; 2993dfbe8321SBarry Smith PetscErrorCode ierr; 29947c334f02SBarry Smith PetscMPIInt size; 2995273d9f13SBarry Smith 2996273d9f13SBarry Smith PetscFunctionBegin; 2997ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)B),&size);CHKERRQ(ierr); 2998e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Comm must be of size 1"); 299955659b69SBarry Smith 3000b00a9115SJed Brown ierr = PetscNewLog(B,&b);CHKERRQ(ierr); 3001549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 300244cd7ae7SLois Curfman McInnes B->data = (void*)b; 
300318f449edSLois Curfman McInnes 3004273d9f13SBarry Smith b->roworiented = PETSC_TRUE; 30054e220ebcSLois Curfman McInnes 300649a6ff4bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetLDA_C",MatDenseGetLDA_SeqDense);CHKERRQ(ierr); 3007bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetArray_C",MatDenseGetArray_SeqDense);CHKERRQ(ierr); 30088572280aSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreArray_C",MatDenseRestoreArray_SeqDense);CHKERRQ(ierr); 3009d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDensePlaceArray_C",MatDensePlaceArray_SeqDense);CHKERRQ(ierr); 3010d3042a70SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseResetArray_C",MatDenseResetArray_SeqDense);CHKERRQ(ierr); 3011d5ea218eSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseReplaceArray_C",MatDenseReplaceArray_SeqDense);CHKERRQ(ierr); 30128572280aSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetArrayRead_C",MatDenseGetArray_SeqDense);CHKERRQ(ierr); 3013715b7558SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreArrayRead_C",MatDenseRestoreArray_SeqDense);CHKERRQ(ierr); 30146947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetArrayWrite_C",MatDenseGetArray_SeqDense);CHKERRQ(ierr); 30156947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreArrayWrite_C",MatDenseRestoreArray_SeqDense);CHKERRQ(ierr); 3016bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqdense_seqaij_C",MatConvert_SeqDense_SeqAIJ);CHKERRQ(ierr); 30178baccfbdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 30188baccfbdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqdense_elemental_C",MatConvert_SeqDense_Elemental);CHKERRQ(ierr); 30198baccfbdSHong Zhang #endif 30202bf066beSStefano Zampini #if 
defined(PETSC_HAVE_CUDA) 30212bf066beSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqdense_seqdensecuda_C",MatConvert_SeqDense_SeqDenseCUDA);CHKERRQ(ierr); 30224222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdensecuda_seqdensecuda_C",MatProductSetFromOptions_SeqDense);CHKERRQ(ierr); 30234222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdensecuda_seqdense_C",MatProductSetFromOptions_SeqDense);CHKERRQ(ierr); 3024637a0070SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqdensecuda_C",MatProductSetFromOptions_SeqDense);CHKERRQ(ierr); 30254222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaijcusparse_seqdense_C",MatProductSetFromOptions_SeqAIJ_SeqDense);CHKERRQ(ierr); 30262bf066beSStefano Zampini #endif 3027bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqDenseSetPreallocation_C",MatSeqDenseSetPreallocation_SeqDense);CHKERRQ(ierr); 30284222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqdense_C",MatProductSetFromOptions_SeqAIJ_SeqDense);CHKERRQ(ierr); 30294222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqdense_C",MatProductSetFromOptions_SeqDense);CHKERRQ(ierr); 3030bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqaij_seqdense_C",MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 3031bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqaij_seqdense_C",MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 30324222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqbaij_seqdense_C",MatProductSetFromOptions_SeqXBAIJ_SeqDense);CHKERRQ(ierr); 3033a001520aSPierre Jolivet ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqbaij_seqdense_C",MatMatMultSymbolic_SeqBAIJ_SeqDense);CHKERRQ(ierr); 3034a001520aSPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqbaij_seqdense_C",MatMatMultNumeric_SeqBAIJ_SeqDense);CHKERRQ(ierr); 30354222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqsbaij_seqdense_C",MatProductSetFromOptions_SeqXBAIJ_SeqDense);CHKERRQ(ierr); 3036c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqsbaij_seqdense_C",MatMatMultSymbolic_SeqSBAIJ_SeqDense);CHKERRQ(ierr); 3037c2916339SPierre Jolivet ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqsbaij_seqdense_C",MatMatMultNumeric_SeqSBAIJ_SeqDense);CHKERRQ(ierr); 30384099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqaijperm_seqdense_C",MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 30394099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqaijperm_seqdense_C",MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 3040e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqaijsell_seqdense_C",MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 3041e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqaijsell_seqdense_C",MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 304296e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqaijmkl_seqdense_C",MatMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 304396e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqaijmkl_seqdense_C",MatMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 304452c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_nest_seqdense_C",MatMatMultSymbolic_Nest_Dense);CHKERRQ(ierr); 
304552c5f739Sprj- ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_nest_seqdense_C",MatMatMultNumeric_Nest_Dense);CHKERRQ(ierr); 304696e6d5c4SRichard Tran Mills 30473bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultSymbolic_seqaij_seqdense_C",MatTransposeMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 30483bf78175SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultNumeric_seqaij_seqdense_C",MatTransposeMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 30494099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultSymbolic_seqaijperm_seqdense_C",MatTransposeMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 30504099cc6bSBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultNumeric_seqaijperm_seqdense_C",MatTransposeMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 3051e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultSymbolic_seqaijsell_seqdense_C",MatTransposeMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 3052e9e4f4a6SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultNumeric_seqaijsell_seqdense_C",MatTransposeMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 305396e6d5c4SRichard Tran Mills 305496e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultSymbolic_seqaijmkl_seqdense_C",MatTransposeMatMultSymbolic_SeqAIJ_SeqDense);CHKERRQ(ierr); 305596e6d5c4SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatTransposeMatMultNumeric_seqaijmkl_seqdense_C",MatTransposeMatMultNumeric_SeqAIJ_SeqDense);CHKERRQ(ierr); 3056af53bab2SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumn_C",MatDenseGetColumn_SeqDense);CHKERRQ(ierr); 3057af53bab2SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumn_C",MatDenseRestoreColumn_SeqDense);CHKERRQ(ierr); 
30586947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumnVec_C",MatDenseGetColumnVec_SeqDense);CHKERRQ(ierr); 30596947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumnVec_C",MatDenseRestoreColumnVec_SeqDense);CHKERRQ(ierr); 30606947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumnVecRead_C",MatDenseGetColumnVecRead_SeqDense);CHKERRQ(ierr); 30616947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumnVecRead_C",MatDenseRestoreColumnVecRead_SeqDense);CHKERRQ(ierr); 30626947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseGetColumnVecWrite_C",MatDenseGetColumnVecWrite_SeqDense);CHKERRQ(ierr); 30636947451fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatDenseRestoreColumnVecWrite_C",MatDenseRestoreColumnVecWrite_SeqDense);CHKERRQ(ierr); 306417667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQDENSE);CHKERRQ(ierr); 30653a40ed3dSBarry Smith PetscFunctionReturn(0); 3066289bc588SBarry Smith } 306786aefd0dSHong Zhang 306886aefd0dSHong Zhang /*@C 3069af53bab2SHong Zhang MatDenseGetColumn - gives access to a column of a dense matrix. This is only the local part of the column. You MUST call MatDenseRestoreColumn() to avoid memory bleeding. 307086aefd0dSHong Zhang 307186aefd0dSHong Zhang Not Collective 307286aefd0dSHong Zhang 307386aefd0dSHong Zhang Input Parameter: 307486aefd0dSHong Zhang + mat - a MATSEQDENSE or MATMPIDENSE matrix 307586aefd0dSHong Zhang - col - column index 307686aefd0dSHong Zhang 307786aefd0dSHong Zhang Output Parameter: 307886aefd0dSHong Zhang . 
vals - pointer to the data 307986aefd0dSHong Zhang 308086aefd0dSHong Zhang Level: intermediate 308186aefd0dSHong Zhang 308286aefd0dSHong Zhang .seealso: MatDenseRestoreColumn() 308386aefd0dSHong Zhang @*/ 308486aefd0dSHong Zhang PetscErrorCode MatDenseGetColumn(Mat A,PetscInt col,PetscScalar **vals) 308586aefd0dSHong Zhang { 308686aefd0dSHong Zhang PetscErrorCode ierr; 308786aefd0dSHong Zhang 308886aefd0dSHong Zhang PetscFunctionBegin; 3089d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 3090d5ea218eSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 3091d5ea218eSStefano Zampini PetscValidPointer(vals,3); 309286aefd0dSHong Zhang ierr = PetscUseMethod(A,"MatDenseGetColumn_C",(Mat,PetscInt,PetscScalar**),(A,col,vals));CHKERRQ(ierr); 309386aefd0dSHong Zhang PetscFunctionReturn(0); 309486aefd0dSHong Zhang } 309586aefd0dSHong Zhang 309686aefd0dSHong Zhang /*@C 309786aefd0dSHong Zhang MatDenseRestoreColumn - returns access to a column of a dense matrix which is returned by MatDenseGetColumn(). 309886aefd0dSHong Zhang 309986aefd0dSHong Zhang Not Collective 310086aefd0dSHong Zhang 310186aefd0dSHong Zhang Input Parameter: 310286aefd0dSHong Zhang . mat - a MATSEQDENSE or MATMPIDENSE matrix 310386aefd0dSHong Zhang 310486aefd0dSHong Zhang Output Parameter: 310586aefd0dSHong Zhang . 
vals - pointer to the data 310686aefd0dSHong Zhang 310786aefd0dSHong Zhang Level: intermediate 310886aefd0dSHong Zhang 310986aefd0dSHong Zhang .seealso: MatDenseGetColumn() 311086aefd0dSHong Zhang @*/ 311186aefd0dSHong Zhang PetscErrorCode MatDenseRestoreColumn(Mat A,PetscScalar **vals) 311286aefd0dSHong Zhang { 311386aefd0dSHong Zhang PetscErrorCode ierr; 311486aefd0dSHong Zhang 311586aefd0dSHong Zhang PetscFunctionBegin; 3116d5ea218eSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 3117d5ea218eSStefano Zampini PetscValidPointer(vals,2); 311886aefd0dSHong Zhang ierr = PetscUseMethod(A,"MatDenseRestoreColumn_C",(Mat,PetscScalar**),(A,vals));CHKERRQ(ierr); 311986aefd0dSHong Zhang PetscFunctionReturn(0); 312086aefd0dSHong Zhang } 31216947451fSStefano Zampini 31226947451fSStefano Zampini /*@C 31236947451fSStefano Zampini MatDenseGetColumnVec - Gives read-write access to a column of a dense matrix, represented as a Vec. 31246947451fSStefano Zampini 31256947451fSStefano Zampini Collective 31266947451fSStefano Zampini 31276947451fSStefano Zampini Input Parameter: 31286947451fSStefano Zampini + mat - the Mat object 31296947451fSStefano Zampini - col - the column index 31306947451fSStefano Zampini 31316947451fSStefano Zampini Output Parameter: 31326947451fSStefano Zampini . v - the vector 31336947451fSStefano Zampini 31346947451fSStefano Zampini Notes: 31356947451fSStefano Zampini The vector is owned by PETSc. Users need to call MatDenseRestoreColumnVec() when the vector is no longer needed. 31366947451fSStefano Zampini Use MatDenseGetColumnVecRead() to obtain read-only access or MatDenseGetColumnVecWrite() for write-only access. 
31376947451fSStefano Zampini 31386947451fSStefano Zampini Level: intermediate 31396947451fSStefano Zampini 31406947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVecRead(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecRead(), MatDenseRestoreColumnVecWrite() 31416947451fSStefano Zampini @*/ 31426947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVec(Mat A,PetscInt col,Vec *v) 31436947451fSStefano Zampini { 31446947451fSStefano Zampini PetscErrorCode ierr; 31456947451fSStefano Zampini 31466947451fSStefano Zampini PetscFunctionBegin; 31476947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 31486947451fSStefano Zampini PetscValidType(A,1); 31496947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 31506947451fSStefano Zampini PetscValidPointer(v,3); 31516947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 31526947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 31536947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseGetColumnVec_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 31546947451fSStefano Zampini PetscFunctionReturn(0); 31556947451fSStefano Zampini } 31566947451fSStefano Zampini 31576947451fSStefano Zampini /*@C 31586947451fSStefano Zampini MatDenseRestoreColumnVec - Returns access to a column of a dense matrix obtained from MatDenseGetColumnVec(). 31596947451fSStefano Zampini 31606947451fSStefano Zampini Collective 31616947451fSStefano Zampini 31626947451fSStefano Zampini Input Parameter: 31636947451fSStefano Zampini + mat - the Mat object 31646947451fSStefano Zampini . 
col - the column index 31656947451fSStefano Zampini - v - the Vec object 31666947451fSStefano Zampini 31676947451fSStefano Zampini Level: intermediate 31686947451fSStefano Zampini 31696947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecRead(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVecRead(), MatDenseRestoreColumnVecWrite() 31706947451fSStefano Zampini @*/ 31716947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVec(Mat A,PetscInt col,Vec *v) 31726947451fSStefano Zampini { 31736947451fSStefano Zampini PetscErrorCode ierr; 31746947451fSStefano Zampini 31756947451fSStefano Zampini PetscFunctionBegin; 31766947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 31776947451fSStefano Zampini PetscValidType(A,1); 31786947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 31796947451fSStefano Zampini PetscValidPointer(v,3); 31806947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 31816947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 31826947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseRestoreColumnVec_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 31836947451fSStefano Zampini PetscFunctionReturn(0); 31846947451fSStefano Zampini } 31856947451fSStefano Zampini 31866947451fSStefano Zampini /*@C 31876947451fSStefano Zampini MatDenseGetColumnVecRead - Gives read-only access to a column of a dense matrix, represented as a Vec. 31886947451fSStefano Zampini 31896947451fSStefano Zampini Collective 31906947451fSStefano Zampini 31916947451fSStefano Zampini Input Parameter: 31926947451fSStefano Zampini + mat - the Mat object 31936947451fSStefano Zampini - col - the column index 31946947451fSStefano Zampini 31956947451fSStefano Zampini Output Parameter: 31966947451fSStefano Zampini . 
v - the vector 31976947451fSStefano Zampini 31986947451fSStefano Zampini Notes: 31996947451fSStefano Zampini The vector is owned by PETSc and users cannot modify it. 32006947451fSStefano Zampini Users need to call MatDenseRestoreColumnVecRead() when the vector is no longer needed. 32016947451fSStefano Zampini Use MatDenseGetColumnVec() to obtain read-write access or MatDenseGetColumnVecWrite() for write-only access. 32026947451fSStefano Zampini 32036947451fSStefano Zampini Level: intermediate 32046947451fSStefano Zampini 32056947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecRead(), MatDenseRestoreColumnVecWrite() 32066947451fSStefano Zampini @*/ 32076947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVecRead(Mat A,PetscInt col,Vec *v) 32086947451fSStefano Zampini { 32096947451fSStefano Zampini PetscErrorCode ierr; 32106947451fSStefano Zampini 32116947451fSStefano Zampini PetscFunctionBegin; 32126947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 32136947451fSStefano Zampini PetscValidType(A,1); 32146947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 32156947451fSStefano Zampini PetscValidPointer(v,3); 32166947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 32176947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 32186947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseGetColumnVecRead_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 32196947451fSStefano Zampini PetscFunctionReturn(0); 32206947451fSStefano Zampini } 32216947451fSStefano Zampini 32226947451fSStefano Zampini /*@C 32236947451fSStefano Zampini MatDenseRestoreColumnVecRead - Returns access to a column of a dense matrix obtained from 
MatDenseGetColumnVecRead(). 32246947451fSStefano Zampini 32256947451fSStefano Zampini Collective 32266947451fSStefano Zampini 32276947451fSStefano Zampini Input Parameter: 32286947451fSStefano Zampini + mat - the Mat object 32296947451fSStefano Zampini . col - the column index 32306947451fSStefano Zampini - v - the Vec object 32316947451fSStefano Zampini 32326947451fSStefano Zampini Level: intermediate 32336947451fSStefano Zampini 32346947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecRead(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecWrite() 32356947451fSStefano Zampini @*/ 32366947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVecRead(Mat A,PetscInt col,Vec *v) 32376947451fSStefano Zampini { 32386947451fSStefano Zampini PetscErrorCode ierr; 32396947451fSStefano Zampini 32406947451fSStefano Zampini PetscFunctionBegin; 32416947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 32426947451fSStefano Zampini PetscValidType(A,1); 32436947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 32446947451fSStefano Zampini PetscValidPointer(v,3); 32456947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 32466947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 32476947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseRestoreColumnVecRead_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 32486947451fSStefano Zampini PetscFunctionReturn(0); 32496947451fSStefano Zampini } 32506947451fSStefano Zampini 32516947451fSStefano Zampini /*@C 32526947451fSStefano Zampini MatDenseGetColumnVecWrite - Gives write-only access to a column of a dense matrix, represented as a Vec. 
32536947451fSStefano Zampini 32546947451fSStefano Zampini Collective 32556947451fSStefano Zampini 32566947451fSStefano Zampini Input Parameter: 32576947451fSStefano Zampini + mat - the Mat object 32586947451fSStefano Zampini - col - the column index 32596947451fSStefano Zampini 32606947451fSStefano Zampini Output Parameter: 32616947451fSStefano Zampini . v - the vector 32626947451fSStefano Zampini 32636947451fSStefano Zampini Notes: 32646947451fSStefano Zampini The vector is owned by PETSc. Users need to call MatDenseRestoreColumnVecWrite() when the vector is no longer needed. 32656947451fSStefano Zampini Use MatDenseGetColumnVec() to obtain read-write access or MatDenseGetColumnVecRead() for read-only access. 32666947451fSStefano Zampini 32676947451fSStefano Zampini Level: intermediate 32686947451fSStefano Zampini 32696947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecRead(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecRead(), MatDenseRestoreColumnVecWrite() 32706947451fSStefano Zampini @*/ 32716947451fSStefano Zampini PetscErrorCode MatDenseGetColumnVecWrite(Mat A,PetscInt col,Vec *v) 32726947451fSStefano Zampini { 32736947451fSStefano Zampini PetscErrorCode ierr; 32746947451fSStefano Zampini 32756947451fSStefano Zampini PetscFunctionBegin; 32766947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 32776947451fSStefano Zampini PetscValidType(A,1); 32786947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 32796947451fSStefano Zampini PetscValidPointer(v,3); 32806947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 32816947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 32826947451fSStefano Zampini ierr = 
PetscUseMethod(A,"MatDenseGetColumnVecWrite_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 32836947451fSStefano Zampini PetscFunctionReturn(0); 32846947451fSStefano Zampini } 32856947451fSStefano Zampini 32866947451fSStefano Zampini /*@C 32876947451fSStefano Zampini MatDenseRestoreColumnVecWrite - Returns access to a column of a dense matrix obtained from MatDenseGetColumnVecWrite(). 32886947451fSStefano Zampini 32896947451fSStefano Zampini Collective 32906947451fSStefano Zampini 32916947451fSStefano Zampini Input Parameter: 32926947451fSStefano Zampini + mat - the Mat object 32936947451fSStefano Zampini . col - the column index 32946947451fSStefano Zampini - v - the Vec object 32956947451fSStefano Zampini 32966947451fSStefano Zampini Level: intermediate 32976947451fSStefano Zampini 32986947451fSStefano Zampini .seealso: MATDENSE, MATDENSECUDA, MatDenseGetColumnVec(), MatDenseGetColumnVecRead(), MatDenseGetColumnVecWrite(), MatDenseRestoreColumnVec(), MatDenseRestoreColumnVecRead() 32996947451fSStefano Zampini @*/ 33006947451fSStefano Zampini PetscErrorCode MatDenseRestoreColumnVecWrite(Mat A,PetscInt col,Vec *v) 33016947451fSStefano Zampini { 33026947451fSStefano Zampini PetscErrorCode ierr; 33036947451fSStefano Zampini 33046947451fSStefano Zampini PetscFunctionBegin; 33056947451fSStefano Zampini PetscValidHeaderSpecific(A,MAT_CLASSID,1); 33066947451fSStefano Zampini PetscValidType(A,1); 33076947451fSStefano Zampini PetscValidLogicalCollectiveInt(A,col,2); 33086947451fSStefano Zampini PetscValidPointer(v,3); 33096947451fSStefano Zampini if (!A->preallocated) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ORDER,"Matrix not preallocated"); 33106947451fSStefano Zampini if (col < 0 || col > A->cmap->N) SETERRQ2(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Invalid col %D, should be in [0,%D)",col,A->cmap->N); 33116947451fSStefano Zampini ierr = PetscUseMethod(A,"MatDenseRestoreColumnVecWrite_C",(Mat,PetscInt,Vec*),(A,col,v));CHKERRQ(ierr); 
33126947451fSStefano Zampini PetscFunctionReturn(0); 33136947451fSStefano Zampini } 3314