1ceb9aaf7SBarry Smith 2af0996ceSBarry Smith #include <petsc/private/matimpl.h> /*I "petscmat.h" I*/ 3ceb9aaf7SBarry Smith 4ceb9aaf7SBarry Smith typedef struct { 5ab92ecdeSBarry Smith Mat A,U,V; 6*9d9032efSJose E. Roman Vec work1,work2; /* Sequential vectors that hold partial products */ 7ab92ecdeSBarry Smith PetscMPIInt nwork; /* length of work vectors */ 8ab92ecdeSBarry Smith } Mat_LRC; 9ab92ecdeSBarry Smith 10ab92ecdeSBarry Smith 11cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatMultTranspose_SeqDense(Mat,Vec,Vec); 12cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatMultAdd_SeqDense(Mat,Vec,Vec,Vec); 13ceb9aaf7SBarry Smith 14ceb9aaf7SBarry Smith #undef __FUNCT__ 15ab92ecdeSBarry Smith #define __FUNCT__ "MatMult_LRC" 16ab92ecdeSBarry Smith PetscErrorCode MatMult_LRC(Mat N,Vec x,Vec y) 17ceb9aaf7SBarry Smith { 18ab92ecdeSBarry Smith Mat_LRC *Na = (Mat_LRC*)N->data; 19ceb9aaf7SBarry Smith PetscErrorCode ierr; 20ab92ecdeSBarry Smith PetscScalar *w1,*w2; 21ceb9aaf7SBarry Smith 22ceb9aaf7SBarry Smith PetscFunctionBegin; 23ab92ecdeSBarry Smith ierr = MatMult(Na->A,x,y);CHKERRQ(ierr); 24ab92ecdeSBarry Smith 25ab92ecdeSBarry Smith /* multiply the local part of V with the local part of x */ 26ab92ecdeSBarry Smith /* note in this call x is treated as a sequential vector */ 27cc2e6a90SBarry Smith ierr = MatMultTranspose_SeqDense(Na->V,x,Na->work1);CHKERRQ(ierr); 28ab92ecdeSBarry Smith 29ab92ecdeSBarry Smith /* Form the sum of all the local multiplies : this is work2 = V'*x = 30ab92ecdeSBarry Smith sum_{all processors} work1 */ 31ab92ecdeSBarry Smith 32ab92ecdeSBarry Smith ierr = VecGetArray(Na->work1,&w1);CHKERRQ(ierr); 33ab92ecdeSBarry Smith ierr = VecGetArray(Na->work2,&w2);CHKERRQ(ierr); 34b2566f29SBarry Smith ierr = MPIU_Allreduce(w1,w2,Na->nwork,MPIU_SCALAR,MPIU_SUM,PetscObjectComm((PetscObject)N));CHKERRQ(ierr); 35ab92ecdeSBarry Smith ierr = VecRestoreArray(Na->work1,&w1);CHKERRQ(ierr); 36ab92ecdeSBarry Smith ierr = VecRestoreArray(Na->work2,&w2);CHKERRQ(ierr); 37ab92ecdeSBarry Smith 38ab92ecdeSBarry Smith /* multiply-sub y = y + U*work2 */ 39ab92ecdeSBarry Smith /* note in this call y is treated as a sequential vector */ 40cc2e6a90SBarry Smith ierr = MatMultAdd_SeqDense(Na->U,Na->work2,y,y);CHKERRQ(ierr); 41ceb9aaf7SBarry Smith PetscFunctionReturn(0); 42ceb9aaf7SBarry Smith } 43ceb9aaf7SBarry Smith 44ceb9aaf7SBarry Smith #undef __FUNCT__ 45ab92ecdeSBarry Smith #define __FUNCT__ "MatDestroy_LRC" 46ab92ecdeSBarry Smith PetscErrorCode MatDestroy_LRC(Mat N) 47ceb9aaf7SBarry Smith { 48ab92ecdeSBarry Smith Mat_LRC *Na = (Mat_LRC*)N->data; 49ceb9aaf7SBarry Smith PetscErrorCode ierr; 50ceb9aaf7SBarry Smith 51ceb9aaf7SBarry Smith PetscFunctionBegin; 52bf0cc555SLisandro Dalcin ierr = MatDestroy(&Na->A);CHKERRQ(ierr); 53bf0cc555SLisandro Dalcin ierr = MatDestroy(&Na->U);CHKERRQ(ierr); 54bf0cc555SLisandro Dalcin ierr = MatDestroy(&Na->V);CHKERRQ(ierr); 556bf464f9SBarry Smith ierr = VecDestroy(&Na->work1);CHKERRQ(ierr); 566bf464f9SBarry Smith ierr = VecDestroy(&Na->work2);CHKERRQ(ierr); 57bf0cc555SLisandro Dalcin ierr = PetscFree(N->data);CHKERRQ(ierr); 58ceb9aaf7SBarry Smith PetscFunctionReturn(0); 59ceb9aaf7SBarry Smith } 60ceb9aaf7SBarry Smith 61ceb9aaf7SBarry Smith 62ceb9aaf7SBarry Smith #undef __FUNCT__ 63ab92ecdeSBarry Smith #define __FUNCT__ "MatCreateLRC" 64ceb9aaf7SBarry Smith /*@ 65ab92ecdeSBarry Smith MatCreateLRC - Creates a new matrix object that behaves like A + U*V' 66ceb9aaf7SBarry Smith 67ceb9aaf7SBarry Smith Collective on Mat 68ceb9aaf7SBarry Smith 69*9d9032efSJose E. Roman Input Parameters: 70ab92ecdeSBarry Smith + A - the (sparse) matrix 71*9d9032efSJose E. Roman - U, V - two dense rectangular (tall and skinny) matrices 72ceb9aaf7SBarry Smith 73ceb9aaf7SBarry Smith Output Parameter: 74ab92ecdeSBarry Smith . N - the matrix that represents A + U*V' 75ceb9aaf7SBarry Smith 76*9d9032efSJose E. Roman Notes: 77*9d9032efSJose E. Roman The matrix A + U*V' is not formed! Rather the new matrix 78ceb9aaf7SBarry Smith object performs the matrix-vector product by first multiplying by 79*9d9032efSJose E. Roman A and then adding the other term. 80*9d9032efSJose E. Roman 81*9d9032efSJose E. Roman Level: intermediate 82ceb9aaf7SBarry Smith @*/ 837087cfbeSBarry Smith PetscErrorCode MatCreateLRC(Mat A,Mat U,Mat V,Mat *N) 84ceb9aaf7SBarry Smith { 85ceb9aaf7SBarry Smith PetscErrorCode ierr; 86*9d9032efSJose E. Roman PetscInt m,n,k,m1,n1,k1; 87ab92ecdeSBarry Smith Mat_LRC *Na; 88ceb9aaf7SBarry Smith 89ceb9aaf7SBarry Smith PetscFunctionBegin; 90*9d9032efSJose E. Roman PetscValidHeaderSpecific(A,MAT_CLASSID,1); 91*9d9032efSJose E. Roman PetscValidHeaderSpecific(U,MAT_CLASSID,2); 92*9d9032efSJose E. Roman PetscValidHeaderSpecific(V,MAT_CLASSID,3); 93*9d9032efSJose E. Roman 94*9d9032efSJose E. Roman ierr = MatGetSize(U,NULL,&k);CHKERRQ(ierr); 95*9d9032efSJose E. Roman ierr = MatGetSize(V,NULL,&k1);CHKERRQ(ierr); 96*9d9032efSJose E. Roman if (k!=k1) SETERRQ(PetscObjectComm((PetscObject)U),PETSC_ERR_ARG_INCOMP,"U and V have different number of columns"); 97*9d9032efSJose E. Roman ierr = MatGetLocalSize(U,&m,NULL);CHKERRQ(ierr); 98*9d9032efSJose E. Roman ierr = MatGetLocalSize(V,&n,NULL);CHKERRQ(ierr); 99*9d9032efSJose E. Roman ierr = MatGetLocalSize(A,&m1,&n1);CHKERRQ(ierr); 100*9d9032efSJose E. Roman if (m!=m1) SETERRQ(PetscObjectComm((PetscObject)U),PETSC_ERR_ARG_INCOMP,"Local dimensions of U and A do not match"); 101*9d9032efSJose E. Roman if (n!=n1) SETERRQ(PetscObjectComm((PetscObject)V),PETSC_ERR_ARG_INCOMP,"Local dimensions of V and A do not match"); 102*9d9032efSJose E. Roman 103ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),N);CHKERRQ(ierr); 104*9d9032efSJose E. Roman ierr = MatSetSizes(*N,m,n,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr); 105ab92ecdeSBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)*N,MATLRC);CHKERRQ(ierr); 106ceb9aaf7SBarry Smith 107b00a9115SJed Brown ierr = PetscNewLog(*N,&Na);CHKERRQ(ierr); 10838f2d2fdSLisandro Dalcin (*N)->data = (void*)Na; 109ceb9aaf7SBarry Smith Na->A = A; 110ab92ecdeSBarry Smith 111ab92ecdeSBarry Smith ierr = MatDenseGetLocalMatrix(U,&Na->U);CHKERRQ(ierr); 112ab92ecdeSBarry Smith ierr = MatDenseGetLocalMatrix(V,&Na->V);CHKERRQ(ierr); 113ceb9aaf7SBarry Smith ierr = PetscObjectReference((PetscObject)A);CHKERRQ(ierr); 114ab92ecdeSBarry Smith ierr = PetscObjectReference((PetscObject)Na->U);CHKERRQ(ierr); 115ab92ecdeSBarry Smith ierr = PetscObjectReference((PetscObject)Na->V);CHKERRQ(ierr); 116ceb9aaf7SBarry Smith 117d0f46423SBarry Smith ierr = VecCreateSeq(PETSC_COMM_SELF,U->cmap->N,&Na->work1);CHKERRQ(ierr); 118ab92ecdeSBarry Smith ierr = VecDuplicate(Na->work1,&Na->work2);CHKERRQ(ierr); 119d0f46423SBarry Smith Na->nwork = U->cmap->N; 120ab92ecdeSBarry Smith 121ab92ecdeSBarry Smith (*N)->ops->destroy = MatDestroy_LRC; 122ab92ecdeSBarry Smith (*N)->ops->mult = MatMult_LRC; 123ceb9aaf7SBarry Smith (*N)->assembled = PETSC_TRUE; 124*9d9032efSJose E. Roman (*N)->cmap->N = V->rmap->N; 125*9d9032efSJose E. Roman (*N)->rmap->N = U->rmap->N; 126*9d9032efSJose E. Roman (*N)->cmap->n = V->rmap->n; 127*9d9032efSJose E. Roman (*N)->rmap->n = U->rmap->n; 128ceb9aaf7SBarry Smith PetscFunctionReturn(0); 129ceb9aaf7SBarry Smith } 130ceb9aaf7SBarry Smith 131