/* Defines basic operations for the MATSEQBAIJMKL matrix class. Uses sparse BLAS operations from the Intel Math Kernel Library (MKL) wherever possible. If used MKL verion is older than 11.3 PETSc default code for sparse matrix operations is used. */ #include <../src/mat/impls/baij/seq/baij.h> #include <../src/mat/impls/baij/seq/baijmkl/baijmkl.h> /* MKL include files. */ #include /* Sparse BLAS */ #ifdef PETSC_HAVE_MKL_SPARSE_OPTIMIZE typedef struct { PetscBool sparse_optimized; /* If PETSC_TRUE, then mkl_sparse_optimize() has been called. */ sparse_matrix_t bsrA; /* "Handle" used by SpMV2 inspector-executor routines. */ struct matrix_descr descr; #ifndef PETSC_MKL_SUPPORTS_BAIJ_ZERO_BASED PetscInt *ai1; PetscInt *aj1; #endif } Mat_SeqBAIJMKL; extern PetscErrorCode MatAssemblyEnd_SeqBAIJ(Mat,MatAssemblyType); PETSC_INTERN PetscErrorCode MatConvert_SeqBAIJMKL_SeqBAIJ(Mat A,MatType type,MatReuse reuse,Mat *newmat) { /* This routine is only called to convert a MATBAIJMKL to its base PETSc type, */ /* so we will ignore 'MatType type'. */ PetscErrorCode ierr; Mat B = *newmat; Mat_SeqBAIJMKL *baijmkl=(Mat_SeqBAIJMKL*)A->spptr; PetscFunctionBegin; if (reuse == MAT_INITIAL_MATRIX) { ierr = MatDuplicate(A,MAT_COPY_VALUES,&B);CHKERRQ(ierr); } /* Reset the original function pointers. */ B->ops->duplicate = MatDuplicate_SeqBAIJ; B->ops->assemblyend = MatAssemblyEnd_SeqBAIJ; B->ops->destroy = MatDestroy_SeqBAIJ; B->ops->multtranspose = MatMultTranspose_SeqBAIJ; B->ops->multtransposeadd = MatMultTransposeAdd_SeqBAIJ; B->ops->scale = MatScale_SeqBAIJ; B->ops->diagonalscale = MatDiagonalScale_SeqBAIJ; B->ops->axpy = MatAXPY_SeqBAIJ; switch (A->rmap->bs) { case 1: B->ops->mult = MatMult_SeqBAIJ_1; B->ops->multadd = MatMultAdd_SeqBAIJ_1; break; case 2: B->ops->mult = MatMult_SeqBAIJ_2; B->ops->multadd = MatMultAdd_SeqBAIJ_2; break; case 3: B->ops->mult = MatMult_SeqBAIJ_3; B->ops->multadd = MatMultAdd_SeqBAIJ_3; break; case 4: B->ops->mult = MatMult_SeqBAIJ_4; B->ops->multadd = MatMultAdd_SeqBAIJ_4; break; case 5: B->ops->mult = MatMult_SeqBAIJ_5; B->ops->multadd = MatMultAdd_SeqBAIJ_5; break; case 6: B->ops->mult = MatMult_SeqBAIJ_6; B->ops->multadd = MatMultAdd_SeqBAIJ_6; break; case 7: B->ops->mult = MatMult_SeqBAIJ_7; B->ops->multadd = MatMultAdd_SeqBAIJ_7; break; case 11: B->ops->mult = MatMult_SeqBAIJ_11; B->ops->multadd = MatMultAdd_SeqBAIJ_11; break; case 15: B->ops->mult = MatMult_SeqBAIJ_15_ver1; B->ops->multadd = MatMultAdd_SeqBAIJ_N; break; default: B->ops->mult = MatMult_SeqBAIJ_N; B->ops->multadd = MatMultAdd_SeqBAIJ_N; break; } ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqbaijmkl_seqbaij_C",NULL);CHKERRQ(ierr); /* Free everything in the Mat_SeqBAIJMKL data structure. Currently, this * simply involves destroying the MKL sparse matrix handle and then freeing * the spptr pointer. */ if (reuse == MAT_INITIAL_MATRIX) baijmkl = (Mat_SeqBAIJMKL*)B->spptr; if (baijmkl->sparse_optimized) { sparse_status_t stat; stat = mkl_sparse_destroy(baijmkl->bsrA); if (stat != SPARSE_STATUS_SUCCESS) { PetscFunctionReturn(PETSC_ERR_LIB); } } #ifndef PETSC_MKL_SUPPORTS_BAIJ_ZERO_BASED ierr = PetscFree(baijmkl->ai1);CHKERRQ(ierr); ierr = PetscFree(baijmkl->aj1);CHKERRQ(ierr); #endif ierr = PetscFree(B->spptr);CHKERRQ(ierr); /* Change the type of B to MATSEQBAIJ. */ ierr = PetscObjectChangeTypeName((PetscObject)B, MATSEQBAIJ);CHKERRQ(ierr); *newmat = B; PetscFunctionReturn(0); } PetscErrorCode MatDestroy_SeqBAIJMKL(Mat A) { PetscErrorCode ierr; Mat_SeqBAIJMKL *baijmkl = (Mat_SeqBAIJMKL*) A->spptr; PetscFunctionBegin; if (baijmkl) { /* Clean up everything in the Mat_SeqBAIJMKL data structure, then free A->spptr. */ if (baijmkl->sparse_optimized) { sparse_status_t stat = SPARSE_STATUS_SUCCESS; stat = mkl_sparse_destroy(baijmkl->bsrA); if (stat != SPARSE_STATUS_SUCCESS) { PetscFunctionReturn(PETSC_ERR_LIB); } } #ifndef PETSC_MKL_SUPPORTS_BAIJ_ZERO_BASED ierr = PetscFree(baijmkl->ai1);CHKERRQ(ierr); ierr = PetscFree(baijmkl->aj1);CHKERRQ(ierr); #endif ierr = PetscFree(A->spptr);CHKERRQ(ierr); } /* Change the type of A back to SEQBAIJ and use MatDestroy_SeqBAIJ() * to destroy everything that remains. */ ierr = PetscObjectChangeTypeName((PetscObject)A, MATSEQBAIJ);CHKERRQ(ierr); ierr = MatDestroy_SeqBAIJ(A);CHKERRQ(ierr); PetscFunctionReturn(0); } PETSC_INTERN PetscErrorCode MatSeqBAIJMKL_create_mkl_handle(Mat A) { PetscErrorCode ierr; Mat_SeqBAIJ *a = (Mat_SeqBAIJ*)A->data; Mat_SeqBAIJMKL *baijmkl = (Mat_SeqBAIJMKL*)A->spptr; PetscInt mbs, nbs, nz, bs, i; MatScalar *aa; PetscInt *aj,*ai; sparse_status_t stat; PetscFunctionBegin; if (baijmkl->sparse_optimized) { /* Matrix has been previously assembled and optimized. Must destroy old * matrix handle before running the optimization step again. */ stat = mkl_sparse_destroy(baijmkl->bsrA); if (stat != SPARSE_STATUS_SUCCESS) { PetscFunctionReturn(PETSC_ERR_LIB); } } baijmkl->sparse_optimized = PETSC_FALSE; /* Now perform the SpMV2 setup and matrix optimization. */ baijmkl->descr.type = SPARSE_MATRIX_TYPE_GENERAL; baijmkl->descr.mode = SPARSE_FILL_MODE_LOWER; baijmkl->descr.diag = SPARSE_DIAG_NON_UNIT; mbs = a->mbs; nbs = a->nbs; nz = a->nz; bs = A->rmap->bs; aa = a->a; if (nz) { /* Create a new, optimized sparse matrix handle only if the matrix has nonzero entries. * The MKL sparse-inspector executor routines don't like being passed an empty matrix. */ #ifdef PETSC_MKL_SUPPORTS_BAIJ_ZERO_BASED aj = a->j; ai = a->i; stat = mkl_sparse_x_create_bsr(&(baijmkl->bsrA),SPARSE_INDEX_BASE_ZERO,SPARSE_LAYOUT_COLUMN_MAJOR,mbs,nbs,bs,ai,ai+1,aj,aa); #else ierr = PetscMalloc1(mbs+1,&ai);CHKERRQ(ierr); ierr = PetscMalloc1(nz,&aj);CHKERRQ(ierr); for (i=0;ii[i]+1; for (i=0;ij[i]+1; aa = a->a; stat = mkl_sparse_x_create_bsr(&baijmkl->bsrA,SPARSE_INDEX_BASE_ONE,SPARSE_LAYOUT_COLUMN_MAJOR,mbs,nbs,bs,ai,ai+1,aj,aa); baijmkl->ai1 = ai; baijmkl->aj1 = aj; #endif stat = mkl_sparse_set_mv_hint(baijmkl->bsrA,SPARSE_OPERATION_NON_TRANSPOSE,baijmkl->descr,1000); stat = mkl_sparse_set_memory_hint(baijmkl->bsrA,SPARSE_MEMORY_AGGRESSIVE); stat = mkl_sparse_optimize(baijmkl->bsrA); if (stat != SPARSE_STATUS_SUCCESS) { SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"Intel MKL error: unable to create matrix handle/complete mkl_sparse_optimize"); PetscFunctionReturn(PETSC_ERR_LIB); } baijmkl->sparse_optimized = PETSC_TRUE; } PetscFunctionReturn(0); } PetscErrorCode MatDuplicate_SeqBAIJMKL(Mat A, MatDuplicateOption op, Mat *M) { PetscErrorCode ierr; Mat_SeqBAIJMKL *baijmkl; Mat_SeqBAIJMKL *baijmkl_dest; PetscFunctionBegin; ierr = MatDuplicate_SeqBAIJ(A,op,M);CHKERRQ(ierr); baijmkl = (Mat_SeqBAIJMKL*) A->spptr; baijmkl_dest = (Mat_SeqBAIJMKL*) (*M)->spptr; ierr = PetscMemcpy(baijmkl_dest,baijmkl,sizeof(Mat_SeqBAIJMKL));CHKERRQ(ierr); baijmkl_dest->sparse_optimized = PETSC_FALSE; ierr = MatSeqBAIJMKL_create_mkl_handle(A);CHKERRQ(ierr); PetscFunctionReturn(0); } PetscErrorCode MatAssemblyEnd_SeqBAIJMKL(Mat A, MatAssemblyType mode) { PetscErrorCode ierr; PetscFunctionBegin; if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); ierr = MatAssemblyEnd_SeqBAIJ(A, mode);CHKERRQ(ierr); ierr = MatSeqBAIJMKL_create_mkl_handle(A);CHKERRQ(ierr); PetscFunctionReturn(0); } PetscErrorCode MatMult_SeqBAIJMKL_SpMV2(Mat A,Vec xx,Vec yy) { Mat_SeqBAIJ *a = (Mat_SeqBAIJ*)A->data; Mat_SeqBAIJMKL *baijmkl=(Mat_SeqBAIJMKL*)A->spptr; const PetscScalar *x; PetscScalar *y; PetscErrorCode ierr; sparse_status_t stat = SPARSE_STATUS_SUCCESS; PetscFunctionBegin; /* If there are no nonzero entries, zero yy and return immediately. */ if(!a->nz) { PetscInt i; PetscInt m=a->mbs*A->rmap->bs; ierr = VecGetArray(yy,&y);CHKERRQ(ierr); for (i=0; isparse_optimized) { MatSeqBAIJMKL_create_mkl_handle(A); } /* Call MKL SpMV2 executor routine to do the MatMult. */ stat = mkl_sparse_x_mv(SPARSE_OPERATION_NON_TRANSPOSE,1.0,baijmkl->bsrA,baijmkl->descr,x,0.0,y); ierr = PetscLogFlops(2.0*a->nz - a->nonzerorowcnt);CHKERRQ(ierr); ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); if (stat != SPARSE_STATUS_SUCCESS) { PetscFunctionReturn(PETSC_ERR_LIB); } PetscFunctionReturn(0); } PetscErrorCode MatMultTranspose_SeqBAIJMKL_SpMV2(Mat A,Vec xx,Vec yy) { Mat_SeqBAIJ *a = (Mat_SeqBAIJ*)A->data; Mat_SeqBAIJMKL *baijmkl=(Mat_SeqBAIJMKL*)A->spptr; const PetscScalar *x; PetscScalar *y; PetscErrorCode ierr; sparse_status_t stat; PetscFunctionBegin; /* If there are no nonzero entries, zero yy and return immediately. */ if(!a->nz) { PetscInt i; PetscInt n=a->nbs; ierr = VecGetArray(yy,&y);CHKERRQ(ierr); for (i=0; isparse_optimized) { MatSeqBAIJMKL_create_mkl_handle(A); } /* Call MKL SpMV2 executor routine to do the MatMultTranspose. */ stat = mkl_sparse_x_mv(SPARSE_OPERATION_TRANSPOSE,1.0,baijmkl->bsrA,baijmkl->descr,x,0.0,y); ierr = PetscLogFlops(2.0*a->nz - a->nonzerorowcnt);CHKERRQ(ierr); ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); if (stat != SPARSE_STATUS_SUCCESS) { PetscFunctionReturn(PETSC_ERR_LIB); } PetscFunctionReturn(0); } PetscErrorCode MatMultAdd_SeqBAIJMKL_SpMV2(Mat A,Vec xx,Vec yy,Vec zz) { Mat_SeqBAIJ *a = (Mat_SeqBAIJ*)A->data; Mat_SeqBAIJMKL *baijmkl=(Mat_SeqBAIJMKL*)A->spptr; const PetscScalar *x; PetscScalar *y,*z; PetscErrorCode ierr; PetscInt m=a->mbs*A->rmap->bs; PetscInt i; sparse_status_t stat = SPARSE_STATUS_SUCCESS; PetscFunctionBegin; /* If there are no nonzero entries, set zz = yy and return immediately. */ if(!a->nz) { PetscInt i; ierr = VecGetArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); for (i=0; isparse_optimized) { MatSeqBAIJMKL_create_mkl_handle(A); } /* Call MKL sparse BLAS routine to do the MatMult. */ if (zz == yy) { /* If zz and yy are the same vector, we can use mkl_sparse_x_mv, which calculates y = alpha*A*x + beta*y, * with alpha and beta both set to 1.0. */ stat = mkl_sparse_x_mv(SPARSE_OPERATION_NON_TRANSPOSE,1.0,baijmkl->bsrA,baijmkl->descr,x,1.0,z); } else { /* zz and yy are different vectors, so we call mkl_sparse_x_mv with alpha=1.0 and beta=0.0, and then * we add the contents of vector yy to the result; MKL sparse BLAS does not have a MatMultAdd equivalent. */ stat = mkl_sparse_x_mv(SPARSE_OPERATION_NON_TRANSPOSE,1.0,baijmkl->bsrA,baijmkl->descr,x,0.0,z); for (i=0; inz);CHKERRQ(ierr); ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); ierr = VecRestoreArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); if (stat != SPARSE_STATUS_SUCCESS) { PetscFunctionReturn(PETSC_ERR_LIB); } PetscFunctionReturn(0); } PetscErrorCode MatMultTransposeAdd_SeqBAIJMKL_SpMV2(Mat A,Vec xx,Vec yy,Vec zz) { Mat_SeqBAIJ *a = (Mat_SeqBAIJ*)A->data; Mat_SeqBAIJMKL *baijmkl=(Mat_SeqBAIJMKL*)A->spptr; const PetscScalar *x; PetscScalar *y,*z; PetscErrorCode ierr; PetscInt n=a->nbs*A->rmap->bs; PetscInt i; /* Variables not in MatMultTransposeAdd_SeqBAIJ. */ sparse_status_t stat = SPARSE_STATUS_SUCCESS; PetscFunctionBegin; /* If there are no nonzero entries, set zz = yy and return immediately. */ if(!a->nz) { PetscInt i; ierr = VecGetArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); for (i=0; isparse_optimized) { MatSeqBAIJMKL_create_mkl_handle(A); } /* Call MKL sparse BLAS routine to do the MatMult. */ if (zz == yy) { /* If zz and yy are the same vector, we can use mkl_sparse_x_mv, which calculates y = alpha*A*x + beta*y, * with alpha and beta both set to 1.0. */ stat = mkl_sparse_x_mv(SPARSE_OPERATION_TRANSPOSE,1.0,baijmkl->bsrA,baijmkl->descr,x,1.0,z); } else { /* zz and yy are different vectors, so we call mkl_sparse_x_mv with alpha=1.0 and beta=0.0, and then * we add the contents of vector yy to the result; MKL sparse BLAS does not have a MatMultAdd equivalent. */ stat = mkl_sparse_x_mv(SPARSE_OPERATION_TRANSPOSE,1.0,baijmkl->bsrA,baijmkl->descr,x,0.0,z); for (i=0; inz);CHKERRQ(ierr); ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); ierr = VecRestoreArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); if (stat != SPARSE_STATUS_SUCCESS) { PetscFunctionReturn(PETSC_ERR_LIB); } PetscFunctionReturn(0); } PetscErrorCode MatScale_SeqBAIJMKL(Mat inA,PetscScalar alpha) { PetscErrorCode ierr; PetscFunctionBegin; ierr = MatScale_SeqBAIJ(inA,alpha);CHKERRQ(ierr); ierr = MatSeqBAIJMKL_create_mkl_handle(inA);CHKERRQ(ierr); PetscFunctionReturn(0); } PetscErrorCode MatDiagonalScale_SeqBAIJMKL(Mat A,Vec ll,Vec rr) { PetscErrorCode ierr; PetscFunctionBegin; ierr = MatDiagonalScale_SeqBAIJ(A,ll,rr);CHKERRQ(ierr); ierr = MatSeqBAIJMKL_create_mkl_handle(A);CHKERRQ(ierr); PetscFunctionReturn(0); } PetscErrorCode MatAXPY_SeqBAIJMKL(Mat Y,PetscScalar a,Mat X,MatStructure str) { PetscErrorCode ierr; PetscFunctionBegin; ierr = MatAXPY_SeqBAIJ(Y,a,X,str);CHKERRQ(ierr); if (str == SAME_NONZERO_PATTERN) { /* MatAssemblyEnd() is not called if SAME_NONZERO_PATTERN, so we need to force update of the MKL matrix handle. */ ierr = MatSeqBAIJMKL_create_mkl_handle(Y);CHKERRQ(ierr); } PetscFunctionReturn(0); } /* MatConvert_SeqBAIJ_SeqBAIJMKL converts a SeqBAIJ matrix into a * SeqBAIJMKL matrix. This routine is called by the MatCreate_SeqMKLBAIJ() * routine, but can also be used to convert an assembled SeqBAIJ matrix * into a SeqBAIJMKL one. */ PETSC_INTERN PetscErrorCode MatConvert_SeqBAIJ_SeqBAIJMKL(Mat A,MatType type,MatReuse reuse,Mat *newmat) { PetscErrorCode ierr; Mat B = *newmat; Mat_SeqBAIJMKL *baijmkl; PetscBool sametype; PetscFunctionBegin; if (reuse == MAT_INITIAL_MATRIX) { ierr = MatDuplicate(A,MAT_COPY_VALUES,&B);CHKERRQ(ierr); } ierr = PetscObjectTypeCompare((PetscObject)A,type,&sametype);CHKERRQ(ierr); if (sametype) PetscFunctionReturn(0); ierr = PetscNewLog(B,&baijmkl);CHKERRQ(ierr); B->spptr = (void*) baijmkl; /* Set function pointers for methods that we inherit from BAIJ but override. * We also parse some command line options below, since those determine some of the methods we point to. */ B->ops->duplicate = MatDuplicate_SeqBAIJMKL; B->ops->assemblyend = MatAssemblyEnd_SeqBAIJMKL; B->ops->destroy = MatDestroy_SeqBAIJMKL; B->ops->mult = MatMult_SeqBAIJMKL_SpMV2; B->ops->multtranspose = MatMultTranspose_SeqBAIJMKL_SpMV2; B->ops->multadd = MatMultAdd_SeqBAIJMKL_SpMV2; B->ops->multtransposeadd = MatMultTransposeAdd_SeqBAIJMKL_SpMV2; B->ops->scale = MatScale_SeqBAIJMKL; B->ops->diagonalscale = MatDiagonalScale_SeqBAIJMKL; B->ops->axpy = MatAXPY_SeqBAIJMKL; baijmkl->sparse_optimized = PETSC_FALSE; ierr = PetscObjectComposeFunction((PetscObject)B,"MatScale_SeqBAIJMKL_C",MatScale_SeqBAIJMKL);CHKERRQ(ierr); ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqbaijmkl_seqbaij_C",MatConvert_SeqBAIJMKL_SeqBAIJ);CHKERRQ(ierr); ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQBAIJMKL);CHKERRQ(ierr); *newmat = B; PetscFunctionReturn(0); } #endif /* PETSC_HAVE_MKL_SPARSE_OPTIMIZE */ /*@C MatCreateSeqBAIJMKL - Creates a sparse matrix of type SEQBAIJMKL. This type inherits from BAIJ and is largely identical, but uses sparse BLAS routines from Intel MKL whenever possible. MatMult, MatMultAdd, MatMultTranspose, and MatMultTransposeAdd operations are currently supported. If the installed version of MKL supports the "SpMV2" sparse inspector-executor routines, then those are used by default. Default PETSc kernels are used otherwise. Input Parameters: + comm - MPI communicator, set to PETSC_COMM_SELF . bs - size of block, the blocks are ALWAYS square. One can use MatSetBlockSizes() to set a different row and column blocksize but the row blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with MatCreateVecs() . m - number of rows . n - number of columns . nz - number of nonzero blocks per block row (same for all rows) - nnz - array containing the number of nonzero blocks in the various block rows (possibly different for each block row) or NULL Output Parameter: . A - the matrix It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(), MatXXXXSetPreallocation() paradgm instead of this routine directly. [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] Options Database Keys: . -mat_no_unroll - uses code that does not unroll the loops in the block calculations (much slower) . -mat_block_size - size of the blocks to use Level: intermediate Notes: The number of rows and columns must be divisible by blocksize. If the nnz parameter is given then the nz parameter is ignored A nonzero block is any block that as 1 or more nonzeros in it The block AIJ format is fully compatible with standard Fortran 77 storage. That is, the stored row and column indices can begin at either one (as in Fortran) or zero. See the users' manual for details. Specify the preallocated storage with either nz or nnz (not both). Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory allocation. See Users-Manual: ch_mat for details. matrices. .seealso: MatCreate(), MatCreateSeqAIJ(), MatSetValues(), MatCreateBAIJ() @*/ PetscErrorCode MatCreateSeqBAIJMKL(MPI_Comm comm,PetscInt bs,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) { PetscErrorCode ierr; PetscFunctionBegin; ierr = MatCreate(comm,A);CHKERRQ(ierr); ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); #ifdef PETSC_HAVE_MKL_SPARSE_OPTIMIZE ierr = MatSetType(*A,MATSEQBAIJMKL);CHKERRQ(ierr); ierr = MatSeqBAIJSetPreallocation_SeqBAIJ(*A,bs,nz,(PetscInt*)nnz);CHKERRQ(ierr); #else ierr = PetscInfo(A,"MKL baij routines are not supported for used version of MKL. Using PETSc default routines. \n Please use version of MKL 11.3 and higher. \n"); ierr = MatSetType(*A,MATSEQBAIJ);CHKERRQ(ierr); ierr = MatSeqBAIJSetPreallocation(*A,bs,nz,(PetscInt*)nnz);CHKERRQ(ierr); #endif PetscFunctionReturn(0); } PETSC_EXTERN PetscErrorCode MatCreate_SeqBAIJMKL(Mat A) { PetscErrorCode ierr; PetscFunctionBegin; ierr = MatSetType(A,MATSEQBAIJ);CHKERRQ(ierr); #ifdef PETSC_HAVE_MKL_SPARSE_OPTIMIZE ierr = MatConvert_SeqBAIJ_SeqBAIJMKL(A,MATSEQBAIJMKL,MAT_INPLACE_MATRIX,&A);CHKERRQ(ierr); #else ierr = PetscInfo(A,"MKL baij routines are not supported for used version of MKL. Using PETSc default routines. \n Please use version of MKL 11.3 and higher. \n"); #endif PetscFunctionReturn(0); }