147d993e7Ssuyashtn /* Portions of this code are under: 247d993e7Ssuyashtn Copyright (c) 2022 Advanced Micro Devices, Inc. All rights reserved. 347d993e7Ssuyashtn */ 46524c165SJacob Faibussowitsch #ifndef __DENSE_H 5f6f390a9SLois Curfman McInnes #define __DENSE_H 6af0996ceSBarry Smith #include <petsc/private/matimpl.h> 76718818eSStefano Zampini /* TODO REMOVE */ 8afea5027SHong Zhang #include <../src/mat/impls/aij/seq/aij.h> /* Mat_MatTransMatMult is defined here */ 9f6f390a9SLois Curfman McInnes 10f6f390a9SLois Curfman McInnes /* 11f6f390a9SLois Curfman McInnes MATSEQDENSE format - conventional dense Fortran storage (by columns) 12f6f390a9SLois Curfman McInnes */ 13f6f390a9SLois Curfman McInnes 14f6f390a9SLois Curfman McInnes typedef struct { 15ea709b57SSatish Balay PetscScalar *v; /* matrix elements */ 16d3042a70SBarry Smith PetscScalar *unplacedarray; /* if one called MatDensePlaceArray(), this is where it stashed the original */ 17ace3abfcSBarry Smith PetscBool roworiented; /* if true, row oriented input (default) */ 1813f74950SBarry Smith PetscInt pad; /* padding */ 194ce68768SBarry Smith PetscBLASInt *pivots; /* pivots in LU factorization */ 20a49dc2a2SStefano Zampini PetscBLASInt lfwork; /* length of work array in factorization */ 21a49dc2a2SStefano Zampini PetscScalar *fwork; /* work array in factorization */ 224905a7bcSToby Isaac PetscScalar *tau; /* scalar factors of QR factorization */ 234396437dSToby Isaac Vec qrrhs; /* RHS for solving with QR (solution vector can't hold copy of RHS) */ 24284134d9SBarry Smith PetscBLASInt lda; /* Lapack leading dimension of data */ 254905a7bcSToby Isaac PetscBLASInt rank; /* numerical rank (of a QR factorized matrix) */ 26ace3abfcSBarry Smith PetscBool user_alloc; /* true if the user provided the dense data */ 27d3042a70SBarry Smith PetscBool unplaced_user_alloc; 286718818eSStefano Zampini 295ea7661aSPierre Jolivet /* Support for MatDenseGetColumnVec and MatDenseGetSubMatrix */ 305ea7661aSPierre Jolivet Mat cmat; /* matrix representation of a given subset of columns */ 316947451fSStefano Zampini Vec cvec; /* vector representation of a given column */ 326947451fSStefano Zampini const PetscScalar *ptrinuse; /* holds array to be restored (just a placeholder) */ 336947451fSStefano Zampini PetscInt vecinuse; /* if cvec is in use (col = vecinuse-1) */ 345ea7661aSPierre Jolivet PetscInt matinuse; /* if cmat is in use (cbegin = matinuse-1) */ 35f6f390a9SLois Curfman McInnes } Mat_SeqDense; 36f6f390a9SLois Curfman McInnes 374222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatMatMultSymbolic_SeqDense_SeqDense(Mat, Mat, PetscReal, Mat); 38ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatMatMultNumeric_SeqDense_SeqDense(Mat, Mat, Mat); 394222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatTransposeMatMultSymbolic_SeqDense_SeqDense(Mat, Mat, PetscReal, Mat); 40ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatTransposeMatMultNumeric_SeqDense_SeqDense(Mat, Mat, Mat); 414222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatMatTransposeMultSymbolic_SeqDense_SeqDense(Mat, Mat, PetscReal, Mat); 42ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatMatTransposeMultNumeric_SeqDense_SeqDense(Mat, Mat, Mat); 434222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatMatMultSymbolic_SeqAIJ_SeqDense(Mat, Mat, PetscReal, Mat); 44ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatMatMultNumeric_SeqAIJ_SeqDense(Mat, Mat, Mat); 454222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatMatMultSymbolic_SeqBAIJ_SeqDense(Mat, Mat, PetscReal, Mat); 46ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatMatMultNumeric_SeqBAIJ_SeqDense(Mat, Mat, Mat); 474222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatMatMultSymbolic_SeqSBAIJ_SeqDense(Mat, Mat, PetscReal, Mat); 48c2916339SPierre Jolivet PETSC_INTERN PetscErrorCode MatMatMultNumeric_SeqSBAIJ_SeqDense(Mat, Mat, Mat); 4952c5f739Sprj- PETSC_INTERN PetscErrorCode MatMatMultSymbolic_Nest_Dense(Mat, Mat, PetscReal, Mat *); 5052c5f739Sprj- PETSC_INTERN PetscErrorCode MatMatMultNumeric_Nest_Dense(Mat, Mat, Mat); 51ca15aa20SStefano Zampini 524222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_SeqDense(Mat); 534222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_SeqAIJ_SeqDense(Mat); 544222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_SeqXBAIJ_SeqDense(Mat); 554222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_SeqDense_SeqAIJ(Mat); 564222ddf1SHong Zhang 57*4742e46bSJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatCreate_SeqDense(Mat); 58ca15aa20SStefano Zampini 5947d993e7Ssuyashtn /* Used by SeqDenseCUDA and seqDenseHIP */ 60ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatDuplicateNoCreate_SeqDense(Mat, Mat, MatDuplicateOption); 61ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatNorm_SeqDense(Mat, NormType, PetscReal *); 62ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatView_SeqDense(Mat, PetscViewer); 63ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatDestroy_SeqDense(Mat); 64ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatDenseGetArray_SeqDense(Mat, PetscScalar *[]); 65ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatDenseRestoreArray_SeqDense(Mat, PetscScalar *[]); 66ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatAXPY_SeqDense(Mat, PetscScalar, Mat, MatStructure); 67ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatMultTransposeAdd_SeqDense(Mat, Vec, Vec, Vec); 68ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatMultTranspose_SeqDense(Mat, Vec, Vec); 69ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatMultAdd_SeqDense(Mat, Vec, Vec, Vec); 70ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatMult_SeqDense(Mat, Vec, Vec); 71ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatDuplicate_SeqDense(Mat, MatDuplicateOption, Mat *); 72ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqDenseSetPreallocation_SeqDense(Mat, PetscScalar *); 73ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatCholeskyFactor_SeqDense(Mat, IS, const MatFactorInfo *); 74ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatLUFactor_SeqDense(Mat, IS, IS, const MatFactorInfo *); 75bf5a80bcSToby Isaac PETSC_INTERN PetscErrorCode MatQRFactor_SeqDense(Mat, IS, const MatFactorInfo *); 76ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatCholeskyFactorSymbolic_SeqDense(Mat, Mat, IS, const MatFactorInfo *); 77ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatLUFactorSymbolic_SeqDense(Mat, Mat, IS, IS, const MatFactorInfo *); 78bf5a80bcSToby Isaac PETSC_INTERN PetscErrorCode MatQRFactorSymbolic_SeqDense(Mat, Mat, IS, const MatFactorInfo *); 79ca15aa20SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqDenseSymmetrize_Private(Mat, PetscBool); 80637a0070SStefano Zampini PETSC_INTERN PetscErrorCode MatGetColumnVector_SeqDense(Mat, Vec, PetscInt); 81637a0070SStefano Zampini PETSC_INTERN PetscErrorCode MatScale_SeqDense(Mat, PetscScalar); 82126e4e93SJose E. Roman PETSC_INTERN PetscErrorCode MatShift_SeqDense(Mat, PetscScalar); 836947451fSStefano Zampini PETSC_INTERN PetscErrorCode MatDenseGetColumnVec_SeqDense(Mat, PetscInt, Vec *); 846947451fSStefano Zampini PETSC_INTERN PetscErrorCode MatDenseRestoreColumnVec_SeqDense(Mat, PetscInt, Vec *); 856947451fSStefano Zampini PETSC_INTERN PetscErrorCode MatDenseGetColumnVecRead_SeqDense(Mat, PetscInt, Vec *); 866947451fSStefano Zampini PETSC_INTERN PetscErrorCode MatDenseRestoreColumnVecRead_SeqDense(Mat, PetscInt, Vec *); 876947451fSStefano Zampini PETSC_INTERN PetscErrorCode MatDenseGetColumnVecWrite_SeqDense(Mat, PetscInt, Vec *); 886947451fSStefano Zampini PETSC_INTERN PetscErrorCode MatDenseRestoreColumnVecWrite_SeqDense(Mat, PetscInt, Vec *); 89a2748737SPierre Jolivet PETSC_INTERN PetscErrorCode MatDenseGetSubMatrix_SeqDense(Mat, PetscInt, PetscInt, PetscInt, PetscInt, Mat *); 905ea7661aSPierre Jolivet PETSC_INTERN PetscErrorCode MatDenseRestoreSubMatrix_SeqDense(Mat, Mat *); 9117359960SJose E. Roman PETSC_INTERN PetscErrorCode MatDenseSetLDA_SeqDense(Mat, PetscInt); 92a76f77c3SStefano Zampini PETSC_INTERN PetscErrorCode MatCopy_SeqDense(Mat, Mat, MatStructure); 933d8925e7SStefano Zampini PETSC_INTERN PetscErrorCode MatZeroEntries_SeqDense(Mat); 9475f6d85dSStefano Zampini PETSC_INTERN PetscErrorCode MatSetUp_SeqDense(Mat); 953faff063SStefano Zampini PETSC_INTERN PetscErrorCode MatSetRandom_SeqDense(Mat, PetscRandom); 9618476b09SLois Curfman McInnes 972bf066beSStefano Zampini #if defined(PETSC_HAVE_CUDA) 98*4742e46bSJacob Faibussowitsch PETSC_SINGLE_LIBRARY_INTERN PetscErrorCode MatSeqDenseCUDAInvertFactors_Internal(Mat); 99*4742e46bSJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatMatMultNumeric_SeqDenseCUDA_SeqDenseCUDA_Internal(Mat, Mat, Mat, PetscBool, PetscBool); 1002bf066beSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqDense_SeqDenseCUDA(Mat, MatType, MatReuse, Mat *); 1012bf066beSStefano Zampini #endif 1022bf066beSStefano Zampini 10347d993e7Ssuyashtn #if defined(PETSC_HAVE_HIP) 104*4742e46bSJacob Faibussowitsch PETSC_SINGLE_LIBRARY_INTERN PetscErrorCode MatSeqDenseHIPInvertFactors_Internal(Mat); 105*4742e46bSJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatMatMultNumeric_SeqDenseHIP_SeqDenseHIP_Internal(Mat, Mat, Mat, PetscBool, PetscBool); 10647d993e7Ssuyashtn PETSC_INTERN PetscErrorCode MatConvert_SeqDense_SeqDenseHIP(Mat, MatType, MatReuse, Mat *); 10747d993e7Ssuyashtn #endif 10847d993e7Ssuyashtn 10905709791SSatish Balay PETSC_EXTERN PetscErrorCode MatSeqDenseInvertFactors_Private(Mat); 110ec01deb9SMatthew Knepley 111d528f656SJakub Kruzik PETSC_INTERN PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqDense(MPI_Comm, Mat, PetscInt, MatReuse, Mat *); 112d528f656SJakub Kruzik PETSC_INTERN PetscErrorCode MatCreateMPIMatConcatenateSeqMat_MPIDense(MPI_Comm, Mat, PetscInt, MatReuse, Mat *); 113d528f656SJakub Kruzik 1148491ab44SLisandro Dalcin PETSC_INTERN PetscErrorCode MatView_Dense_Binary(Mat, PetscViewer); 1158491ab44SLisandro Dalcin PETSC_INTERN PetscErrorCode MatLoad_Dense_Binary(Mat, PetscViewer); 116eb91f321SVaclav Hapla PETSC_INTERN PetscErrorCode MatLoad_Dense_HDF5(Mat, PetscViewer); 117f6f390a9SLois Curfman McInnes #endif 118