17a94429cSHong Zhang /* 26718818eSStefano Zampini Defines matrix-matrix product routines for 36718818eSStefano Zampini C = A^T * B and C = A * B^t 46718818eSStefano Zampini with A SeqAIJ and B SeqDense 57a94429cSHong Zhang */ 67a94429cSHong Zhang 77a94429cSHong Zhang #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 8afea5027SHong Zhang #include <../src/mat/impls/dense/seq/dense.h> 9afea5027SHong Zhang 10*cc1eb50dSBarry Smith static PetscErrorCode MatProductCtxDestroy_SeqDense_MatTransMatMult(void **data) 11d71ae5a4SJacob Faibussowitsch { 12*cc1eb50dSBarry Smith MatProductCtx_MatTransMatMult *atb = *(MatProductCtx_MatTransMatMult **)data; 13afea5027SHong Zhang 14afea5027SHong Zhang PetscFunctionBegin; 159566063dSJacob Faibussowitsch PetscCall(MatDestroy(&atb->mA)); 169566063dSJacob Faibussowitsch PetscCall(VecDestroy(&atb->bt)); 179566063dSJacob Faibussowitsch PetscCall(VecDestroy(&atb->ct)); 189566063dSJacob Faibussowitsch PetscCall(PetscFree(atb)); 193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 20afea5027SHong Zhang } 217a94429cSHong Zhang 226718818eSStefano Zampini static PetscErrorCode MatTMatTMultNumeric_SeqAIJ_SeqDense(Mat, Mat, Mat); 236718818eSStefano Zampini 24d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatTMatTMultSymbolic_SeqAIJ_SeqDense(Mat A, Mat B, PetscReal fill, Mat C) 25d71ae5a4SJacob Faibussowitsch { 26*cc1eb50dSBarry Smith MatProductCtx_MatTransMatMult *atb; 277a3c3d58SStefano Zampini PetscBool cisdense; 286718818eSStefano Zampini PetscInt dofm; 297a94429cSHong Zhang 307a94429cSHong Zhang PetscFunctionBegin; 316718818eSStefano Zampini MatCheckProduct(C, 4); 3228b400f6SJacob Faibussowitsch PetscCheck(!C->product->data, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Extra product struct not empty"); 33aed4548fSBarry Smith PetscCheck(C->product->type == MATPRODUCT_ABt || C->product->type == MATPRODUCT_AtB, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not for product type %s", MatProductTypes[C->product->type]); 347a94429cSHong Zhang 356718818eSStefano Zampini /* create output dense matrix C */ 366718818eSStefano Zampini if (C->product->type == MATPRODUCT_AtB) { 379566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, A->cmap->n, B->cmap->N, A->cmap->n, B->cmap->N)); 386718818eSStefano Zampini dofm = B->cmap->n; 396718818eSStefano Zampini } else { 409566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, A->rmap->n, B->rmap->N, A->rmap->n, B->rmap->N)); 416718818eSStefano Zampini dofm = B->rmap->n; 426718818eSStefano Zampini } 439566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, "")); 4448a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, ((PetscObject)B)->type_name)); 459566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 467a94429cSHong Zhang 476718818eSStefano Zampini /* create additional data structure for the product */ 489566063dSJacob Faibussowitsch PetscCall(PetscNew(&atb)); 499566063dSJacob Faibussowitsch PetscCall(MatCreateMAIJ(A, dofm, &atb->mA)); 509566063dSJacob Faibussowitsch PetscCall(MatCreateVecs(atb->mA, &atb->ct, &atb->bt)); 516718818eSStefano Zampini C->product->data = atb; 52*cc1eb50dSBarry Smith C->product->destroy = MatProductCtxDestroy_SeqDense_MatTransMatMult; 537a94429cSHong Zhang 546718818eSStefano Zampini if (C->product->type == MATPRODUCT_AtB) { 556718818eSStefano Zampini C->ops->transposematmultnumeric = MatTMatTMultNumeric_SeqAIJ_SeqDense; 566718818eSStefano Zampini } else { 576718818eSStefano Zampini C->ops->mattransposemultnumeric = MatTMatTMultNumeric_SeqAIJ_SeqDense; 586718818eSStefano Zampini } 593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 60c608a817SHong Zhang } 61c608a817SHong Zhang 6266976f2fSJacob Faibussowitsch static PetscErrorCode MatTMatTMultNumeric_SeqAIJ_SeqDense(Mat A, Mat B, Mat C) 63d71ae5a4SJacob Faibussowitsch { 646718818eSStefano Zampini PetscInt i, j, m = A->rmap->n, n = A->cmap->n, blda, clda; 656718818eSStefano Zampini PetscInt mdof = C->cmap->N; 666718818eSStefano Zampini const PetscScalar *Barray; 676718818eSStefano Zampini PetscScalar *Carray; 68*cc1eb50dSBarry Smith MatProductCtx_MatTransMatMult *atb; 696718818eSStefano Zampini Vec bt, ct; 70c608a817SHong Zhang 71c608a817SHong Zhang PetscFunctionBegin; 726718818eSStefano Zampini MatCheckProduct(C, 3); 73aed4548fSBarry Smith PetscCheck(C->product->type == MATPRODUCT_ABt || C->product->type == MATPRODUCT_AtB, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not for product type %s", MatProductTypes[C->product->type]); 74*cc1eb50dSBarry Smith atb = (MatProductCtx_MatTransMatMult *)C->product->data; 7528b400f6SJacob Faibussowitsch PetscCheck(atb, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Missing product struct"); 766718818eSStefano Zampini bt = atb->bt; 776718818eSStefano Zampini ct = atb->ct; 78c608a817SHong Zhang 799566063dSJacob Faibussowitsch PetscCall(MatDenseGetArrayRead(B, &Barray)); 809566063dSJacob Faibussowitsch PetscCall(MatDenseGetLDA(B, &blda)); 819566063dSJacob Faibussowitsch PetscCall(MatDenseGetArrayWrite(C, &Carray)); 829566063dSJacob Faibussowitsch PetscCall(MatDenseGetLDA(C, &clda)); 836718818eSStefano Zampini if (C->product->type == MATPRODUCT_AtB) { /* transpose local array of B, then copy it to vector bt */ 846718818eSStefano Zampini const PetscScalar *ctarray; 856718818eSStefano Zampini PetscScalar *btarray; 867a94429cSHong Zhang 879566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(bt, &btarray)); 886718818eSStefano Zampini for (j = 0; j < mdof; j++) { 896718818eSStefano Zampini for (i = 0; i < m; i++) btarray[i * mdof + j] = Barray[j * blda + i]; 907a94429cSHong Zhang } 919566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(bt, &btarray)); 927a94429cSHong Zhang 937a94429cSHong Zhang /* compute ct = mA^T * cb */ 949566063dSJacob Faibussowitsch PetscCall(MatMultTranspose(atb->mA, bt, ct)); 957a94429cSHong Zhang 967a3c3d58SStefano Zampini /* transpose local array of ct to matrix C */ 979566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ct, &ctarray)); 986718818eSStefano Zampini for (j = 0; j < mdof; j++) { 996718818eSStefano Zampini for (i = 0; i < n; i++) Carray[j * clda + i] = ctarray[i * mdof + j]; 1007a94429cSHong Zhang } 1019566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ct, &ctarray)); 1026718818eSStefano Zampini } else { 1036718818eSStefano Zampini const PetscScalar *btarray; 1046718818eSStefano Zampini PetscScalar *ctarray; 1056718818eSStefano Zampini 1066718818eSStefano Zampini if (blda == B->rmap->n) { 1079566063dSJacob Faibussowitsch PetscCall(VecPlaceArray(ct, Barray)); 1086718818eSStefano Zampini } else { 1096718818eSStefano Zampini PetscInt bn = B->cmap->n; 1106718818eSStefano Zampini PetscInt bm = B->rmap->n; 1116718818eSStefano Zampini 1129566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(ct, &ctarray)); 1136718818eSStefano Zampini for (j = 0; j < bn; j++) { 1146718818eSStefano Zampini for (i = 0; i < bm; i++) ctarray[j * bm + i] = Barray[j * blda + i]; 1156718818eSStefano Zampini } 1169566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(ct, &ctarray)); 1176718818eSStefano Zampini } 1186718818eSStefano Zampini 1199566063dSJacob Faibussowitsch PetscCall(MatMult(atb->mA, ct, bt)); 12048a46eb9SPierre Jolivet if (blda == B->rmap->n) PetscCall(VecResetArray(ct)); 1219566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bt, &btarray)); 1226718818eSStefano Zampini for (j = 0; j < mdof; j++) { 1236718818eSStefano Zampini for (i = 0; i < m; i++) Carray[j * clda + i] = btarray[i * mdof + j]; 1246718818eSStefano Zampini } 1259566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bt, &btarray)); 1266718818eSStefano Zampini } 1279566063dSJacob Faibussowitsch PetscCall(MatDenseRestoreArrayRead(B, &Barray)); 1289566063dSJacob Faibussowitsch PetscCall(MatDenseRestoreArray(C, &Carray)); 1293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1307a94429cSHong Zhang } 131