173f4d377SMatthew Knepley /*$Id: mpidense.c,v 1.159 2001/08/10 03:30:41 bsmith Exp $*/ 28965ea79SLois Curfman McInnes 3ed3cc1f0SBarry Smith /* 4ed3cc1f0SBarry Smith Basic functions for basic parallel dense matrices. 5ed3cc1f0SBarry Smith */ 6ed3cc1f0SBarry Smith 770f55243SBarry Smith #include "src/mat/impls/dense/mpi/mpidense.h" 88965ea79SLois Curfman McInnes 90de54da6SSatish Balay EXTERN_C_BEGIN 104a2ae208SSatish Balay #undef __FUNCT__ 114a2ae208SSatish Balay #define __FUNCT__ "MatGetDiagonalBlock_MPIDense" 120de54da6SSatish Balay int MatGetDiagonalBlock_MPIDense(Mat A,PetscTruth *iscopy,MatReuse reuse,Mat *B) 130de54da6SSatish Balay { 140de54da6SSatish Balay Mat_MPIDense *mdn = (Mat_MPIDense*)A->data; 15cfce73b9SSatish Balay int m = A->m,rstart = mdn->rstart,ierr; 1687828ca2SBarry Smith PetscScalar *array; 170de54da6SSatish Balay MPI_Comm comm; 180de54da6SSatish Balay 190de54da6SSatish Balay PetscFunctionBegin; 20273d9f13SBarry Smith if (A->M != A->N) SETERRQ(PETSC_ERR_SUP,"Only square matrices supported."); 210de54da6SSatish Balay 220de54da6SSatish Balay /* The reuse aspect is not implemented efficiently */ 230de54da6SSatish Balay if (reuse) { ierr = MatDestroy(*B);CHKERRQ(ierr);} 240de54da6SSatish Balay 250de54da6SSatish Balay ierr = PetscObjectGetComm((PetscObject)(mdn->A),&comm);CHKERRQ(ierr); 260de54da6SSatish Balay ierr = MatGetArray(mdn->A,&array);CHKERRQ(ierr); 275c5985e7SKris Buschelman ierr = MatCreate(comm,m,m,m,m,B);CHKERRQ(ierr); 285c5985e7SKris Buschelman ierr = MatSetType(*B,mdn->A->type_name);CHKERRQ(ierr); 295c5985e7SKris Buschelman ierr = MatSeqDenseSetPreallocation(*B,array+m*rstart);CHKERRQ(ierr); 300de54da6SSatish Balay ierr = MatRestoreArray(mdn->A,&array);CHKERRQ(ierr); 310de54da6SSatish Balay ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 320de54da6SSatish Balay ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 330de54da6SSatish Balay 340de54da6SSatish Balay *iscopy = PETSC_TRUE; 350de54da6SSatish Balay PetscFunctionReturn(0); 360de54da6SSatish Balay } 370de54da6SSatish Balay EXTERN_C_END 380de54da6SSatish Balay 394a2ae208SSatish Balay #undef __FUNCT__ 404a2ae208SSatish Balay #define __FUNCT__ "MatSetValues_MPIDense" 41f15d580aSBarry Smith int MatSetValues_MPIDense(Mat mat,int m,const int idxm[],int n,const int idxn[],const PetscScalar v[],InsertMode addv) 428965ea79SLois Curfman McInnes { 4339b7565bSBarry Smith Mat_MPIDense *A = (Mat_MPIDense*)mat->data; 4439b7565bSBarry Smith int ierr,i,j,rstart = A->rstart,rend = A->rend,row; 45273d9f13SBarry Smith PetscTruth roworiented = A->roworiented; 468965ea79SLois Curfman McInnes 473a40ed3dSBarry Smith PetscFunctionBegin; 488965ea79SLois Curfman McInnes for (i=0; i<m; i++) { 495ef9f2a5SBarry Smith if (idxm[i] < 0) continue; 50273d9f13SBarry Smith if (idxm[i] >= mat->M) SETERRQ(PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 518965ea79SLois Curfman McInnes if (idxm[i] >= rstart && idxm[i] < rend) { 528965ea79SLois Curfman McInnes row = idxm[i] - rstart; 5339b7565bSBarry Smith if (roworiented) { 5439b7565bSBarry Smith ierr = MatSetValues(A->A,1,&row,n,idxn,v+i*n,addv);CHKERRQ(ierr); 553a40ed3dSBarry Smith } else { 568965ea79SLois Curfman McInnes for (j=0; j<n; j++) { 575ef9f2a5SBarry Smith if (idxn[j] < 0) continue; 58273d9f13SBarry Smith if (idxn[j] >= mat->N) SETERRQ(PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 5939b7565bSBarry Smith ierr = MatSetValues(A->A,1,&row,1,&idxn[j],v+i+j*m,addv);CHKERRQ(ierr); 6039b7565bSBarry Smith } 618965ea79SLois Curfman McInnes } 623a40ed3dSBarry Smith } else { 633782ba37SSatish Balay if (!A->donotstash) { 6439b7565bSBarry Smith if (roworiented) { 658798bf22SSatish Balay ierr = MatStashValuesRow_Private(&mat->stash,idxm[i],n,idxn,v+i*n);CHKERRQ(ierr); 66d36fbae8SSatish Balay } else { 678798bf22SSatish Balay ierr = MatStashValuesCol_Private(&mat->stash,idxm[i],n,idxn,v+i,m);CHKERRQ(ierr); 6839b7565bSBarry Smith } 69b49de8d1SLois Curfman McInnes } 70b49de8d1SLois Curfman McInnes } 713782ba37SSatish Balay } 723a40ed3dSBarry Smith PetscFunctionReturn(0); 73b49de8d1SLois Curfman McInnes } 74b49de8d1SLois Curfman McInnes 754a2ae208SSatish Balay #undef __FUNCT__ 764a2ae208SSatish Balay #define __FUNCT__ "MatGetValues_MPIDense" 77f15d580aSBarry Smith int MatGetValues_MPIDense(Mat mat,int m,const int idxm[],int n,const int idxn[],PetscScalar v[]) 78b49de8d1SLois Curfman McInnes { 79b49de8d1SLois Curfman McInnes Mat_MPIDense *mdn = (Mat_MPIDense*)mat->data; 80b49de8d1SLois Curfman McInnes int ierr,i,j,rstart = mdn->rstart,rend = mdn->rend,row; 81b49de8d1SLois Curfman McInnes 823a40ed3dSBarry Smith PetscFunctionBegin; 83b49de8d1SLois Curfman McInnes for (i=0; i<m; i++) { 8429bbc08cSBarry Smith if (idxm[i] < 0) SETERRQ(PETSC_ERR_ARG_OUTOFRANGE,"Negative row"); 85273d9f13SBarry Smith if (idxm[i] >= mat->M) SETERRQ(PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 86b49de8d1SLois Curfman McInnes if (idxm[i] >= rstart && idxm[i] < rend) { 87b49de8d1SLois Curfman McInnes row = idxm[i] - rstart; 88b49de8d1SLois Curfman McInnes for (j=0; j<n; j++) { 8929bbc08cSBarry Smith if (idxn[j] < 0) SETERRQ(PETSC_ERR_ARG_OUTOFRANGE,"Negative column"); 90273d9f13SBarry Smith if (idxn[j] >= mat->N) { 9129bbc08cSBarry Smith SETERRQ(PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 92a8c6a408SBarry Smith } 93b49de8d1SLois Curfman McInnes ierr = MatGetValues(mdn->A,1,&row,1,&idxn[j],v+i*n+j);CHKERRQ(ierr); 94b49de8d1SLois Curfman McInnes } 95a8c6a408SBarry Smith } else { 9629bbc08cSBarry Smith SETERRQ(PETSC_ERR_SUP,"Only local values currently supported"); 978965ea79SLois Curfman McInnes } 988965ea79SLois Curfman McInnes } 993a40ed3dSBarry Smith PetscFunctionReturn(0); 1008965ea79SLois Curfman McInnes } 1018965ea79SLois Curfman McInnes 1024a2ae208SSatish Balay #undef __FUNCT__ 1034a2ae208SSatish Balay #define __FUNCT__ "MatGetArray_MPIDense" 1044e7234bfSBarry Smith int MatGetArray_MPIDense(Mat A,PetscScalar *array[]) 105ff14e315SSatish Balay { 106ff14e315SSatish Balay Mat_MPIDense *a = (Mat_MPIDense*)A->data; 107ff14e315SSatish Balay int ierr; 108ff14e315SSatish Balay 1093a40ed3dSBarry Smith PetscFunctionBegin; 110ff14e315SSatish Balay ierr = MatGetArray(a->A,array);CHKERRQ(ierr); 1113a40ed3dSBarry Smith PetscFunctionReturn(0); 112ff14e315SSatish Balay } 113ff14e315SSatish Balay 1144a2ae208SSatish Balay #undef __FUNCT__ 1154a2ae208SSatish Balay #define __FUNCT__ "MatGetSubMatrix_MPIDense" 116ca3fa75bSLois Curfman McInnes static int MatGetSubMatrix_MPIDense(Mat A,IS isrow,IS iscol,int cs,MatReuse scall,Mat *B) 117ca3fa75bSLois Curfman McInnes { 118ca3fa75bSLois Curfman McInnes Mat_MPIDense *mat = (Mat_MPIDense*)A->data,*newmatd; 119ca3fa75bSLois Curfman McInnes Mat_SeqDense *lmat = (Mat_SeqDense*)mat->A->data; 120cfce73b9SSatish Balay int i,j,ierr,*irow,*icol,rstart,rend,nrows,ncols,nlrows,nlcols; 12187828ca2SBarry Smith PetscScalar *av,*bv,*v = lmat->v; 122ca3fa75bSLois Curfman McInnes Mat newmat; 123ca3fa75bSLois Curfman McInnes 124ca3fa75bSLois Curfman McInnes PetscFunctionBegin; 125ca3fa75bSLois Curfman McInnes ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 126ca3fa75bSLois Curfman McInnes ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 127b9b97703SBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 128b9b97703SBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 129ca3fa75bSLois Curfman McInnes 130ca3fa75bSLois Curfman McInnes /* No parallel redistribution currently supported! Should really check each index set 1317eba5e9cSLois Curfman McInnes to comfirm that it is OK. ... Currently supports only submatrix same partitioning as 1327eba5e9cSLois Curfman McInnes original matrix! */ 133ca3fa75bSLois Curfman McInnes 134ca3fa75bSLois Curfman McInnes ierr = MatGetLocalSize(A,&nlrows,&nlcols);CHKERRQ(ierr); 1357eba5e9cSLois Curfman McInnes ierr = MatGetOwnershipRange(A,&rstart,&rend);CHKERRQ(ierr); 136ca3fa75bSLois Curfman McInnes 137ca3fa75bSLois Curfman McInnes /* Check submatrix call */ 138ca3fa75bSLois Curfman McInnes if (scall == MAT_REUSE_MATRIX) { 13929bbc08cSBarry Smith /* SETERRQ(PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); */ 1407eba5e9cSLois Curfman McInnes /* Really need to test rows and column sizes! */ 141ca3fa75bSLois Curfman McInnes newmat = *B; 142ca3fa75bSLois Curfman McInnes } else { 143ca3fa75bSLois Curfman McInnes /* Create and fill new matrix */ 144878740d9SKris Buschelman ierr = MatCreate(A->comm,nrows,cs,PETSC_DECIDE,ncols,&newmat);CHKERRQ(ierr); 145878740d9SKris Buschelman ierr = MatSetType(newmat,A->type_name);CHKERRQ(ierr); 146878740d9SKris Buschelman ierr = MatMPIDenseSetPreallocation(newmat,PETSC_NULL);CHKERRQ(ierr); 147ca3fa75bSLois Curfman McInnes } 148ca3fa75bSLois Curfman McInnes 149ca3fa75bSLois Curfman McInnes /* Now extract the data pointers and do the copy, column at a time */ 150ca3fa75bSLois Curfman McInnes newmatd = (Mat_MPIDense*)newmat->data; 151ca3fa75bSLois Curfman McInnes bv = ((Mat_SeqDense *)newmatd->A->data)->v; 152ca3fa75bSLois Curfman McInnes 153ca3fa75bSLois Curfman McInnes for (i=0; i<ncols; i++) { 154ca3fa75bSLois Curfman McInnes av = v + nlrows*icol[i]; 155ca3fa75bSLois Curfman McInnes for (j=0; j<nrows; j++) { 1567eba5e9cSLois Curfman McInnes *bv++ = av[irow[j] - rstart]; 157ca3fa75bSLois Curfman McInnes } 158ca3fa75bSLois Curfman McInnes } 159ca3fa75bSLois Curfman McInnes 160ca3fa75bSLois Curfman McInnes /* Assemble the matrices so that the correct flags are set */ 161ca3fa75bSLois Curfman McInnes ierr = MatAssemblyBegin(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 162ca3fa75bSLois Curfman McInnes ierr = MatAssemblyEnd(newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 163ca3fa75bSLois Curfman McInnes 164ca3fa75bSLois Curfman McInnes /* Free work space */ 165ca3fa75bSLois Curfman McInnes ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 166ca3fa75bSLois Curfman McInnes ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 167ca3fa75bSLois Curfman McInnes *B = newmat; 168ca3fa75bSLois Curfman McInnes PetscFunctionReturn(0); 169ca3fa75bSLois Curfman McInnes } 170ca3fa75bSLois Curfman McInnes 1714a2ae208SSatish Balay #undef __FUNCT__ 1724a2ae208SSatish Balay #define __FUNCT__ "MatRestoreArray_MPIDense" 1734e7234bfSBarry Smith int MatRestoreArray_MPIDense(Mat A,PetscScalar *array[]) 174ff14e315SSatish Balay { 1753a40ed3dSBarry Smith PetscFunctionBegin; 1763a40ed3dSBarry Smith PetscFunctionReturn(0); 177ff14e315SSatish Balay } 178ff14e315SSatish Balay 1794a2ae208SSatish Balay #undef __FUNCT__ 1804a2ae208SSatish Balay #define __FUNCT__ "MatAssemblyBegin_MPIDense" 1818f6be9afSLois Curfman McInnes int MatAssemblyBegin_MPIDense(Mat mat,MatAssemblyType mode) 1828965ea79SLois Curfman McInnes { 18339ddd567SLois Curfman McInnes Mat_MPIDense *mdn = (Mat_MPIDense*)mat->data; 1848965ea79SLois Curfman McInnes MPI_Comm comm = mat->comm; 185d36fbae8SSatish Balay int ierr,nstash,reallocs; 1868965ea79SLois Curfman McInnes InsertMode addv; 1878965ea79SLois Curfman McInnes 1883a40ed3dSBarry Smith PetscFunctionBegin; 1898965ea79SLois Curfman McInnes /* make sure all processors are either in INSERTMODE or ADDMODE */ 190ca161407SBarry Smith ierr = MPI_Allreduce(&mat->insertmode,&addv,1,MPI_INT,MPI_BOR,comm);CHKERRQ(ierr); 1917056b6fcSBarry Smith if (addv == (ADD_VALUES|INSERT_VALUES)) { 19229bbc08cSBarry Smith SETERRQ(PETSC_ERR_ARG_WRONGSTATE,"Cannot mix adds/inserts on different procs"); 1938965ea79SLois Curfman McInnes } 194e0fa3b82SLois Curfman McInnes mat->insertmode = addv; /* in case this processor had no cache */ 1958965ea79SLois Curfman McInnes 1968798bf22SSatish Balay ierr = MatStashScatterBegin_Private(&mat->stash,mdn->rowners);CHKERRQ(ierr); 1978798bf22SSatish Balay ierr = MatStashGetInfo_Private(&mat->stash,&nstash,&reallocs);CHKERRQ(ierr); 198b0a32e0cSBarry Smith PetscLogInfo(mdn->A,"MatAssemblyBegin_MPIDense:Stash has %d entries, uses %d mallocs.\n",nstash,reallocs); 1993a40ed3dSBarry Smith PetscFunctionReturn(0); 2008965ea79SLois Curfman McInnes } 2018965ea79SLois Curfman McInnes 2024a2ae208SSatish Balay #undef __FUNCT__ 2034a2ae208SSatish Balay #define __FUNCT__ "MatAssemblyEnd_MPIDense" 2048f6be9afSLois Curfman McInnes int MatAssemblyEnd_MPIDense(Mat mat,MatAssemblyType mode) 2058965ea79SLois Curfman McInnes { 20639ddd567SLois Curfman McInnes Mat_MPIDense *mdn=(Mat_MPIDense*)mat->data; 2077ef1d9bdSSatish Balay int i,n,ierr,*row,*col,flg,j,rstart,ncols; 20887828ca2SBarry Smith PetscScalar *val; 209e0fa3b82SLois Curfman McInnes InsertMode addv=mat->insertmode; 2108965ea79SLois Curfman McInnes 2113a40ed3dSBarry Smith PetscFunctionBegin; 2128965ea79SLois Curfman McInnes /* wait on receives */ 2137ef1d9bdSSatish Balay while (1) { 2148798bf22SSatish Balay ierr = MatStashScatterGetMesg_Private(&mat->stash,&n,&row,&col,&val,&flg);CHKERRQ(ierr); 2157ef1d9bdSSatish Balay if (!flg) break; 2168965ea79SLois Curfman McInnes 2177ef1d9bdSSatish Balay for (i=0; i<n;) { 2187ef1d9bdSSatish Balay /* Now identify the consecutive vals belonging to the same row */ 2197ef1d9bdSSatish Balay for (j=i,rstart=row[j]; j<n; j++) { if (row[j] != rstart) break; } 2207ef1d9bdSSatish Balay if (j < n) ncols = j-i; 2217ef1d9bdSSatish Balay else ncols = n-i; 2227ef1d9bdSSatish Balay /* Now assemble all these values with a single function call */ 2237ef1d9bdSSatish Balay ierr = MatSetValues_MPIDense(mat,1,row+i,ncols,col+i,val+i,addv);CHKERRQ(ierr); 2247ef1d9bdSSatish Balay i = j; 2258965ea79SLois Curfman McInnes } 2267ef1d9bdSSatish Balay } 2278798bf22SSatish Balay ierr = MatStashScatterEnd_Private(&mat->stash);CHKERRQ(ierr); 2288965ea79SLois Curfman McInnes 22939ddd567SLois Curfman McInnes ierr = MatAssemblyBegin(mdn->A,mode);CHKERRQ(ierr); 23039ddd567SLois Curfman McInnes ierr = MatAssemblyEnd(mdn->A,mode);CHKERRQ(ierr); 2318965ea79SLois Curfman McInnes 2326d4a8577SBarry Smith if (!mat->was_assembled && mode == MAT_FINAL_ASSEMBLY) { 23339ddd567SLois Curfman McInnes ierr = MatSetUpMultiply_MPIDense(mat);CHKERRQ(ierr); 2348965ea79SLois Curfman McInnes } 2353a40ed3dSBarry Smith PetscFunctionReturn(0); 2368965ea79SLois Curfman McInnes } 2378965ea79SLois Curfman McInnes 2384a2ae208SSatish Balay #undef __FUNCT__ 2394a2ae208SSatish Balay #define __FUNCT__ "MatZeroEntries_MPIDense" 2408f6be9afSLois Curfman McInnes int MatZeroEntries_MPIDense(Mat A) 2418965ea79SLois Curfman McInnes { 2423a40ed3dSBarry Smith int ierr; 24339ddd567SLois Curfman McInnes Mat_MPIDense *l = (Mat_MPIDense*)A->data; 2443a40ed3dSBarry Smith 2453a40ed3dSBarry Smith PetscFunctionBegin; 2463a40ed3dSBarry Smith ierr = MatZeroEntries(l->A);CHKERRQ(ierr); 2473a40ed3dSBarry Smith PetscFunctionReturn(0); 2488965ea79SLois Curfman McInnes } 2498965ea79SLois Curfman McInnes 2504a2ae208SSatish Balay #undef __FUNCT__ 2514a2ae208SSatish Balay #define __FUNCT__ "MatGetBlockSize_MPIDense" 2528f6be9afSLois Curfman McInnes int MatGetBlockSize_MPIDense(Mat A,int *bs) 2534e220ebcSLois Curfman McInnes { 2543a40ed3dSBarry Smith PetscFunctionBegin; 2554e220ebcSLois Curfman McInnes *bs = 1; 2563a40ed3dSBarry Smith PetscFunctionReturn(0); 2574e220ebcSLois Curfman McInnes } 2584e220ebcSLois Curfman McInnes 2598965ea79SLois Curfman McInnes /* the code does not do the diagonal entries correctly unless the 2608965ea79SLois Curfman McInnes matrix is square and the column and row owerships are identical. 2618965ea79SLois Curfman McInnes This is a BUG. The only way to fix it seems to be to access 2623501a2bdSLois Curfman McInnes mdn->A and mdn->B directly and not through the MatZeroRows() 2638965ea79SLois Curfman McInnes routine. 2648965ea79SLois Curfman McInnes */ 2654a2ae208SSatish Balay #undef __FUNCT__ 2664a2ae208SSatish Balay #define __FUNCT__ "MatZeroRows_MPIDense" 267268466fbSBarry Smith int MatZeroRows_MPIDense(Mat A,IS is,const PetscScalar *diag) 2688965ea79SLois Curfman McInnes { 26939ddd567SLois Curfman McInnes Mat_MPIDense *l = (Mat_MPIDense*)A->data; 2708965ea79SLois Curfman McInnes int i,ierr,N,*rows,*owners = l->rowners,size = l->size; 271c1dc657dSBarry Smith int *nprocs,j,idx,nsends; 2728965ea79SLois Curfman McInnes int nmax,*svalues,*starts,*owner,nrecvs,rank = l->rank; 2738965ea79SLois Curfman McInnes int *rvalues,tag = A->tag,count,base,slen,n,*source; 2748965ea79SLois Curfman McInnes int *lens,imdex,*lrows,*values; 2758965ea79SLois Curfman McInnes MPI_Comm comm = A->comm; 2768965ea79SLois Curfman McInnes MPI_Request *send_waits,*recv_waits; 2778965ea79SLois Curfman McInnes MPI_Status recv_status,*send_status; 2788965ea79SLois Curfman McInnes IS istmp; 27935d8aa7fSBarry Smith PetscTruth found; 2808965ea79SLois Curfman McInnes 2813a40ed3dSBarry Smith PetscFunctionBegin; 282b9b97703SBarry Smith ierr = ISGetLocalSize(is,&N);CHKERRQ(ierr); 2838965ea79SLois Curfman McInnes ierr = ISGetIndices(is,&rows);CHKERRQ(ierr); 2848965ea79SLois Curfman McInnes 2858965ea79SLois Curfman McInnes /* first count number of contributors to each processor */ 286b0a32e0cSBarry Smith ierr = PetscMalloc(2*size*sizeof(int),&nprocs);CHKERRQ(ierr); 287549d3d68SSatish Balay ierr = PetscMemzero(nprocs,2*size*sizeof(int));CHKERRQ(ierr); 288b0a32e0cSBarry Smith ierr = PetscMalloc((N+1)*sizeof(int),&owner);CHKERRQ(ierr); /* see note*/ 2898965ea79SLois Curfman McInnes for (i=0; i<N; i++) { 2908965ea79SLois Curfman McInnes idx = rows[i]; 29135d8aa7fSBarry Smith found = PETSC_FALSE; 2928965ea79SLois Curfman McInnes for (j=0; j<size; j++) { 2938965ea79SLois Curfman McInnes if (idx >= owners[j] && idx < owners[j+1]) { 294c1dc657dSBarry Smith nprocs[2*j]++; nprocs[2*j+1] = 1; owner[i] = j; found = PETSC_TRUE; break; 2958965ea79SLois Curfman McInnes } 2968965ea79SLois Curfman McInnes } 29729bbc08cSBarry Smith if (!found) SETERRQ(PETSC_ERR_ARG_OUTOFRANGE,"Index out of range"); 2988965ea79SLois Curfman McInnes } 299c1dc657dSBarry Smith nsends = 0; for (i=0; i<size; i++) { nsends += nprocs[2*i+1];} 3008965ea79SLois Curfman McInnes 3018965ea79SLois Curfman McInnes /* inform other processors of number of messages and max length*/ 302c1dc657dSBarry Smith ierr = PetscMaxSum(comm,nprocs,&nmax,&nrecvs);CHKERRQ(ierr); 3038965ea79SLois Curfman McInnes 3048965ea79SLois Curfman McInnes /* post receives: */ 305b0a32e0cSBarry Smith ierr = PetscMalloc((nrecvs+1)*(nmax+1)*sizeof(int),&rvalues);CHKERRQ(ierr); 306b0a32e0cSBarry Smith ierr = PetscMalloc((nrecvs+1)*sizeof(MPI_Request),&recv_waits);CHKERRQ(ierr); 3078965ea79SLois Curfman McInnes for (i=0; i<nrecvs; i++) { 308ca161407SBarry Smith ierr = MPI_Irecv(rvalues+nmax*i,nmax,MPI_INT,MPI_ANY_SOURCE,tag,comm,recv_waits+i);CHKERRQ(ierr); 3098965ea79SLois Curfman McInnes } 3108965ea79SLois Curfman McInnes 3118965ea79SLois Curfman McInnes /* do sends: 3128965ea79SLois Curfman McInnes 1) starts[i] gives the starting index in svalues for stuff going to 3138965ea79SLois Curfman McInnes the ith processor 3148965ea79SLois Curfman McInnes */ 315b0a32e0cSBarry Smith ierr = PetscMalloc((N+1)*sizeof(int),&svalues);CHKERRQ(ierr); 316b0a32e0cSBarry Smith ierr = PetscMalloc((nsends+1)*sizeof(MPI_Request),&send_waits);CHKERRQ(ierr); 317b0a32e0cSBarry Smith ierr = PetscMalloc((size+1)*sizeof(int),&starts);CHKERRQ(ierr); 3188965ea79SLois Curfman McInnes starts[0] = 0; 319c1dc657dSBarry Smith for (i=1; i<size; i++) { starts[i] = starts[i-1] + nprocs[2*i-2];} 3208965ea79SLois Curfman McInnes for (i=0; i<N; i++) { 3218965ea79SLois Curfman McInnes svalues[starts[owner[i]]++] = rows[i]; 3228965ea79SLois Curfman McInnes } 3238965ea79SLois Curfman McInnes ISRestoreIndices(is,&rows); 3248965ea79SLois Curfman McInnes 3258965ea79SLois Curfman McInnes starts[0] = 0; 326c1dc657dSBarry Smith for (i=1; i<size+1; i++) { starts[i] = starts[i-1] + nprocs[2*i-2];} 3278965ea79SLois Curfman McInnes count = 0; 3288965ea79SLois Curfman McInnes for (i=0; i<size; i++) { 329c1dc657dSBarry Smith if (nprocs[2*i+1]) { 330c1dc657dSBarry Smith ierr = MPI_Isend(svalues+starts[i],nprocs[2*i],MPI_INT,i,tag,comm,send_waits+count++);CHKERRQ(ierr); 3318965ea79SLois Curfman McInnes } 3328965ea79SLois Curfman McInnes } 333606d414cSSatish Balay ierr = PetscFree(starts);CHKERRQ(ierr); 3348965ea79SLois Curfman McInnes 3358965ea79SLois Curfman McInnes base = owners[rank]; 3368965ea79SLois Curfman McInnes 3378965ea79SLois Curfman McInnes /* wait on receives */ 338b0a32e0cSBarry Smith ierr = PetscMalloc(2*(nrecvs+1)*sizeof(int),&lens);CHKERRQ(ierr); 3398965ea79SLois Curfman McInnes source = lens + nrecvs; 3408965ea79SLois Curfman McInnes count = nrecvs; slen = 0; 3418965ea79SLois Curfman McInnes while (count) { 342ca161407SBarry Smith ierr = MPI_Waitany(nrecvs,recv_waits,&imdex,&recv_status);CHKERRQ(ierr); 3438965ea79SLois Curfman McInnes /* unpack receives into our local space */ 344ca161407SBarry Smith ierr = MPI_Get_count(&recv_status,MPI_INT,&n);CHKERRQ(ierr); 3458965ea79SLois Curfman McInnes source[imdex] = recv_status.MPI_SOURCE; 3468965ea79SLois Curfman McInnes lens[imdex] = n; 3478965ea79SLois Curfman McInnes slen += n; 3488965ea79SLois Curfman McInnes count--; 3498965ea79SLois Curfman McInnes } 350606d414cSSatish Balay ierr = PetscFree(recv_waits);CHKERRQ(ierr); 3518965ea79SLois Curfman McInnes 3528965ea79SLois Curfman McInnes /* move the data into the send scatter */ 353b0a32e0cSBarry Smith ierr = PetscMalloc((slen+1)*sizeof(int),&lrows);CHKERRQ(ierr); 3548965ea79SLois Curfman McInnes count = 0; 3558965ea79SLois Curfman McInnes for (i=0; i<nrecvs; i++) { 3568965ea79SLois Curfman McInnes values = rvalues + i*nmax; 3578965ea79SLois Curfman McInnes for (j=0; j<lens[i]; j++) { 3588965ea79SLois Curfman McInnes lrows[count++] = values[j] - base; 3598965ea79SLois Curfman McInnes } 3608965ea79SLois Curfman McInnes } 361606d414cSSatish Balay ierr = PetscFree(rvalues);CHKERRQ(ierr); 362606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 363606d414cSSatish Balay ierr = PetscFree(owner);CHKERRQ(ierr); 364606d414cSSatish Balay ierr = PetscFree(nprocs);CHKERRQ(ierr); 3658965ea79SLois Curfman McInnes 3668965ea79SLois Curfman McInnes /* actually zap the local rows */ 367029af93fSBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,slen,lrows,&istmp);CHKERRQ(ierr); 368b0a32e0cSBarry Smith PetscLogObjectParent(A,istmp); 369606d414cSSatish Balay ierr = PetscFree(lrows);CHKERRQ(ierr); 3708965ea79SLois Curfman McInnes ierr = MatZeroRows(l->A,istmp,diag);CHKERRQ(ierr); 3718965ea79SLois Curfman McInnes ierr = ISDestroy(istmp);CHKERRQ(ierr); 3728965ea79SLois Curfman McInnes 3738965ea79SLois Curfman McInnes /* wait on sends */ 3748965ea79SLois Curfman McInnes if (nsends) { 375b0a32e0cSBarry Smith ierr = PetscMalloc(nsends*sizeof(MPI_Status),&send_status);CHKERRQ(ierr); 376ca161407SBarry Smith ierr = MPI_Waitall(nsends,send_waits,send_status);CHKERRQ(ierr); 377606d414cSSatish Balay ierr = PetscFree(send_status);CHKERRQ(ierr); 3788965ea79SLois Curfman McInnes } 379606d414cSSatish Balay ierr = PetscFree(send_waits);CHKERRQ(ierr); 380606d414cSSatish Balay ierr = PetscFree(svalues);CHKERRQ(ierr); 3818965ea79SLois Curfman McInnes 3823a40ed3dSBarry Smith PetscFunctionReturn(0); 3838965ea79SLois Curfman McInnes } 3848965ea79SLois Curfman McInnes 3854a2ae208SSatish Balay #undef __FUNCT__ 3864a2ae208SSatish Balay #define __FUNCT__ "MatMult_MPIDense" 3878f6be9afSLois Curfman McInnes int MatMult_MPIDense(Mat mat,Vec xx,Vec yy) 3888965ea79SLois Curfman McInnes { 38939ddd567SLois Curfman McInnes Mat_MPIDense *mdn = (Mat_MPIDense*)mat->data; 3908965ea79SLois Curfman McInnes int ierr; 391c456f294SBarry Smith 3923a40ed3dSBarry Smith PetscFunctionBegin; 39343a90d84SBarry Smith ierr = VecScatterBegin(xx,mdn->lvec,INSERT_VALUES,SCATTER_FORWARD,mdn->Mvctx);CHKERRQ(ierr); 39443a90d84SBarry Smith ierr = VecScatterEnd(xx,mdn->lvec,INSERT_VALUES,SCATTER_FORWARD,mdn->Mvctx);CHKERRQ(ierr); 39544cd7ae7SLois Curfman McInnes ierr = MatMult_SeqDense(mdn->A,mdn->lvec,yy);CHKERRQ(ierr); 3963a40ed3dSBarry Smith PetscFunctionReturn(0); 3978965ea79SLois Curfman McInnes } 3988965ea79SLois Curfman McInnes 3994a2ae208SSatish Balay #undef __FUNCT__ 4004a2ae208SSatish Balay #define __FUNCT__ "MatMultAdd_MPIDense" 4018f6be9afSLois Curfman McInnes int MatMultAdd_MPIDense(Mat mat,Vec xx,Vec yy,Vec zz) 4028965ea79SLois Curfman McInnes { 40339ddd567SLois Curfman McInnes Mat_MPIDense *mdn = (Mat_MPIDense*)mat->data; 4048965ea79SLois Curfman McInnes int ierr; 405c456f294SBarry Smith 4063a40ed3dSBarry Smith PetscFunctionBegin; 40743a90d84SBarry Smith ierr = VecScatterBegin(xx,mdn->lvec,INSERT_VALUES,SCATTER_FORWARD,mdn->Mvctx);CHKERRQ(ierr); 40843a90d84SBarry Smith ierr = VecScatterEnd(xx,mdn->lvec,INSERT_VALUES,SCATTER_FORWARD,mdn->Mvctx);CHKERRQ(ierr); 40944cd7ae7SLois Curfman McInnes ierr = MatMultAdd_SeqDense(mdn->A,mdn->lvec,yy,zz);CHKERRQ(ierr); 4103a40ed3dSBarry Smith PetscFunctionReturn(0); 4118965ea79SLois Curfman McInnes } 4128965ea79SLois Curfman McInnes 4134a2ae208SSatish Balay #undef __FUNCT__ 4144a2ae208SSatish Balay #define __FUNCT__ "MatMultTranspose_MPIDense" 4157c922b88SBarry Smith int MatMultTranspose_MPIDense(Mat A,Vec xx,Vec yy) 416096963f5SLois Curfman McInnes { 417096963f5SLois Curfman McInnes Mat_MPIDense *a = (Mat_MPIDense*)A->data; 418096963f5SLois Curfman McInnes int ierr; 41987828ca2SBarry Smith PetscScalar zero = 0.0; 420096963f5SLois Curfman McInnes 4213a40ed3dSBarry Smith PetscFunctionBegin; 4223501a2bdSLois Curfman McInnes ierr = VecSet(&zero,yy);CHKERRQ(ierr); 4237c922b88SBarry Smith ierr = MatMultTranspose_SeqDense(a->A,xx,a->lvec);CHKERRQ(ierr); 424537820f0SBarry Smith ierr = VecScatterBegin(a->lvec,yy,ADD_VALUES,SCATTER_REVERSE,a->Mvctx);CHKERRQ(ierr); 425537820f0SBarry Smith ierr = VecScatterEnd(a->lvec,yy,ADD_VALUES,SCATTER_REVERSE,a->Mvctx);CHKERRQ(ierr); 4263a40ed3dSBarry Smith PetscFunctionReturn(0); 427096963f5SLois Curfman McInnes } 428096963f5SLois Curfman McInnes 4294a2ae208SSatish Balay #undef __FUNCT__ 4304a2ae208SSatish Balay #define __FUNCT__ "MatMultTransposeAdd_MPIDense" 4317c922b88SBarry Smith int MatMultTransposeAdd_MPIDense(Mat A,Vec xx,Vec yy,Vec zz) 432096963f5SLois Curfman McInnes { 433096963f5SLois Curfman McInnes Mat_MPIDense *a = (Mat_MPIDense*)A->data; 434096963f5SLois Curfman McInnes int ierr; 435096963f5SLois Curfman McInnes 4363a40ed3dSBarry Smith PetscFunctionBegin; 4373501a2bdSLois Curfman McInnes ierr = VecCopy(yy,zz);CHKERRQ(ierr); 4387c922b88SBarry Smith ierr = MatMultTranspose_SeqDense(a->A,xx,a->lvec);CHKERRQ(ierr); 439537820f0SBarry Smith ierr = VecScatterBegin(a->lvec,zz,ADD_VALUES,SCATTER_REVERSE,a->Mvctx);CHKERRQ(ierr); 440537820f0SBarry Smith ierr = VecScatterEnd(a->lvec,zz,ADD_VALUES,SCATTER_REVERSE,a->Mvctx);CHKERRQ(ierr); 4413a40ed3dSBarry Smith PetscFunctionReturn(0); 442096963f5SLois Curfman McInnes } 443096963f5SLois Curfman McInnes 4444a2ae208SSatish Balay #undef __FUNCT__ 4454a2ae208SSatish Balay #define __FUNCT__ "MatGetDiagonal_MPIDense" 4468f6be9afSLois Curfman McInnes int MatGetDiagonal_MPIDense(Mat A,Vec v) 4478965ea79SLois Curfman McInnes { 44839ddd567SLois Curfman McInnes Mat_MPIDense *a = (Mat_MPIDense*)A->data; 449096963f5SLois Curfman McInnes Mat_SeqDense *aloc = (Mat_SeqDense*)a->A->data; 450273d9f13SBarry Smith int ierr,len,i,n,m = A->m,radd; 45187828ca2SBarry Smith PetscScalar *x,zero = 0.0; 452ed3cc1f0SBarry Smith 4533a40ed3dSBarry Smith PetscFunctionBegin; 454273d9f13SBarry Smith ierr = VecSet(&zero,v);CHKERRQ(ierr); 455b1d4fb26SBarry Smith ierr = VecGetArrayFast(v,&x);CHKERRQ(ierr); 456096963f5SLois Curfman McInnes ierr = VecGetSize(v,&n);CHKERRQ(ierr); 457273d9f13SBarry Smith if (n != A->M) SETERRQ(PETSC_ERR_ARG_SIZ,"Nonconforming mat and vec"); 458273d9f13SBarry Smith len = PetscMin(a->A->m,a->A->n); 4597ddc982cSLois Curfman McInnes radd = a->rstart*m; 46044cd7ae7SLois Curfman McInnes for (i=0; i<len; i++) { 461096963f5SLois Curfman McInnes x[i] = aloc->v[radd + i*m + i]; 462096963f5SLois Curfman McInnes } 463b1d4fb26SBarry Smith ierr = VecRestoreArrayFast(v,&x);CHKERRQ(ierr); 4643a40ed3dSBarry Smith PetscFunctionReturn(0); 4658965ea79SLois Curfman McInnes } 4668965ea79SLois Curfman McInnes 4674a2ae208SSatish Balay #undef __FUNCT__ 4684a2ae208SSatish Balay #define __FUNCT__ "MatDestroy_MPIDense" 469e1311b90SBarry Smith int MatDestroy_MPIDense(Mat mat) 4708965ea79SLois Curfman McInnes { 4713501a2bdSLois Curfman McInnes Mat_MPIDense *mdn = (Mat_MPIDense*)mat->data; 4728965ea79SLois Curfman McInnes int ierr; 473ed3cc1f0SBarry Smith 4743a40ed3dSBarry Smith PetscFunctionBegin; 47594d884c6SBarry Smith 476aa482453SBarry Smith #if defined(PETSC_USE_LOG) 477b0a32e0cSBarry Smith PetscLogObjectState((PetscObject)mat,"Rows=%d, Cols=%d",mat->M,mat->N); 4788965ea79SLois Curfman McInnes #endif 4798798bf22SSatish Balay ierr = MatStashDestroy_Private(&mat->stash);CHKERRQ(ierr); 480606d414cSSatish Balay ierr = PetscFree(mdn->rowners);CHKERRQ(ierr); 4813501a2bdSLois Curfman McInnes ierr = MatDestroy(mdn->A);CHKERRQ(ierr); 4823501a2bdSLois Curfman McInnes if (mdn->lvec) VecDestroy(mdn->lvec); 4833501a2bdSLois Curfman McInnes if (mdn->Mvctx) VecScatterDestroy(mdn->Mvctx); 484622d7880SLois Curfman McInnes if (mdn->factor) { 485606d414cSSatish Balay if (mdn->factor->temp) {ierr = PetscFree(mdn->factor->temp);CHKERRQ(ierr);} 486606d414cSSatish Balay if (mdn->factor->tag) {ierr = PetscFree(mdn->factor->tag);CHKERRQ(ierr);} 487606d414cSSatish Balay if (mdn->factor->pivots) {ierr = PetscFree(mdn->factor->pivots);CHKERRQ(ierr);} 488606d414cSSatish Balay ierr = PetscFree(mdn->factor);CHKERRQ(ierr); 489622d7880SLois Curfman McInnes } 490606d414cSSatish Balay ierr = PetscFree(mdn);CHKERRQ(ierr); 4913a40ed3dSBarry Smith PetscFunctionReturn(0); 4928965ea79SLois Curfman McInnes } 49339ddd567SLois Curfman McInnes 4944a2ae208SSatish Balay #undef __FUNCT__ 4954a2ae208SSatish Balay #define __FUNCT__ "MatView_MPIDense_Binary" 496b0a32e0cSBarry Smith static int MatView_MPIDense_Binary(Mat mat,PetscViewer viewer) 4978965ea79SLois Curfman McInnes { 49839ddd567SLois Curfman McInnes Mat_MPIDense *mdn = (Mat_MPIDense*)mat->data; 4998965ea79SLois Curfman McInnes int ierr; 5007056b6fcSBarry Smith 5013a40ed3dSBarry Smith PetscFunctionBegin; 50239ddd567SLois Curfman McInnes if (mdn->size == 1) { 50339ddd567SLois Curfman McInnes ierr = MatView(mdn->A,viewer);CHKERRQ(ierr); 5048965ea79SLois Curfman McInnes } 50529bbc08cSBarry Smith else SETERRQ(PETSC_ERR_SUP,"Only uniprocessor output supported"); 5063a40ed3dSBarry Smith PetscFunctionReturn(0); 5078965ea79SLois Curfman McInnes } 5088965ea79SLois Curfman McInnes 5094a2ae208SSatish Balay #undef __FUNCT__ 5104a2ae208SSatish Balay #define __FUNCT__ "MatView_MPIDense_ASCIIorDraworSocket" 511b0a32e0cSBarry Smith static int MatView_MPIDense_ASCIIorDraworSocket(Mat mat,PetscViewer viewer) 5128965ea79SLois Curfman McInnes { 51339ddd567SLois Curfman McInnes Mat_MPIDense *mdn = (Mat_MPIDense*)mat->data; 514fb9695e5SSatish Balay int ierr,size = mdn->size,rank = mdn->rank; 515b0a32e0cSBarry Smith PetscViewerType vtype; 516f1af5d2fSBarry Smith PetscTruth isascii,isdraw; 517b0a32e0cSBarry Smith PetscViewer sviewer; 518f3ef73ceSBarry Smith PetscViewerFormat format; 5198965ea79SLois Curfman McInnes 5203a40ed3dSBarry Smith PetscFunctionBegin; 521b0a32e0cSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_ASCII,&isascii);CHKERRQ(ierr); 522fb9695e5SSatish Balay ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_DRAW,&isdraw);CHKERRQ(ierr); 523f1af5d2fSBarry Smith if (isascii) { 524b0a32e0cSBarry Smith ierr = PetscViewerGetType(viewer,&vtype);CHKERRQ(ierr); 525b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 526456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 5274e220ebcSLois Curfman McInnes MatInfo info; 528888f2ed8SSatish Balay ierr = MatGetInfo(mat,MAT_LOCAL,&info);CHKERRQ(ierr); 529b0a32e0cSBarry Smith ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] local rows %d nz %d nz alloced %d mem %d \n",rank,mat->m, 5306831982aSBarry Smith (int)info.nz_used,(int)info.nz_allocated,(int)info.memory);CHKERRQ(ierr); 531b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 5323501a2bdSLois Curfman McInnes ierr = VecScatterView(mdn->Mvctx,viewer);CHKERRQ(ierr); 5333a40ed3dSBarry Smith PetscFunctionReturn(0); 534fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_INFO) { 5353a40ed3dSBarry Smith PetscFunctionReturn(0); 5368965ea79SLois Curfman McInnes } 537f1af5d2fSBarry Smith } else if (isdraw) { 538b0a32e0cSBarry Smith PetscDraw draw; 539f1af5d2fSBarry Smith PetscTruth isnull; 540f1af5d2fSBarry Smith 541b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 542b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 543f1af5d2fSBarry Smith if (isnull) PetscFunctionReturn(0); 544f1af5d2fSBarry Smith } 54577ed5343SBarry Smith 5468965ea79SLois Curfman McInnes if (size == 1) { 54739ddd567SLois Curfman McInnes ierr = MatView(mdn->A,viewer);CHKERRQ(ierr); 5483a40ed3dSBarry Smith } else { 5498965ea79SLois Curfman McInnes /* assemble the entire matrix onto first processor. */ 5508965ea79SLois Curfman McInnes Mat A; 551273d9f13SBarry Smith int M = mat->M,N = mat->N,m,row,i,nz,*cols; 55287828ca2SBarry Smith PetscScalar *vals; 5538965ea79SLois Curfman McInnes 5548965ea79SLois Curfman McInnes if (!rank) { 555878740d9SKris Buschelman ierr = MatCreate(mat->comm,M,N,M,N,&A);CHKERRQ(ierr); 5563a40ed3dSBarry Smith } else { 557878740d9SKris Buschelman ierr = MatCreate(mat->comm,0,0,M,N,&A);CHKERRQ(ierr); 5588965ea79SLois Curfman McInnes } 559*be5d1d56SKris Buschelman /* Since this is a temporary matrix, MATMPIDENSE instead of A->type_name here is probably acceptable. */ 560878740d9SKris Buschelman ierr = MatSetType(A,MATMPIDENSE);CHKERRQ(ierr); 561878740d9SKris Buschelman ierr = MatMPIDenseSetPreallocation(A,PETSC_NULL); 562b0a32e0cSBarry Smith PetscLogObjectParent(mat,A); 5638965ea79SLois Curfman McInnes 56439ddd567SLois Curfman McInnes /* Copy the matrix ... This isn't the most efficient means, 56539ddd567SLois Curfman McInnes but it's quick for now */ 566273d9f13SBarry Smith row = mdn->rstart; m = mdn->A->m; 5678965ea79SLois Curfman McInnes for (i=0; i<m; i++) { 56839ddd567SLois Curfman McInnes ierr = MatGetRow(mat,row,&nz,&cols,&vals);CHKERRQ(ierr); 56939ddd567SLois Curfman McInnes ierr = MatSetValues(A,1,&row,nz,cols,vals,INSERT_VALUES);CHKERRQ(ierr); 57039ddd567SLois Curfman McInnes ierr = MatRestoreRow(mat,row,&nz,&cols,&vals);CHKERRQ(ierr); 57139ddd567SLois Curfman McInnes row++; 5728965ea79SLois Curfman McInnes } 5738965ea79SLois Curfman McInnes 5746d4a8577SBarry Smith ierr = MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 5756d4a8577SBarry Smith ierr = MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 576b0a32e0cSBarry Smith ierr = PetscViewerGetSingleton(viewer,&sviewer);CHKERRQ(ierr); 577b9b97703SBarry Smith if (!rank) { 5786831982aSBarry Smith ierr = MatView(((Mat_MPIDense*)(A->data))->A,sviewer);CHKERRQ(ierr); 5798965ea79SLois Curfman McInnes } 580b0a32e0cSBarry Smith ierr = PetscViewerRestoreSingleton(viewer,&sviewer);CHKERRQ(ierr); 581b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 5828965ea79SLois Curfman McInnes ierr = MatDestroy(A);CHKERRQ(ierr); 5838965ea79SLois Curfman McInnes } 5843a40ed3dSBarry Smith PetscFunctionReturn(0); 5858965ea79SLois Curfman McInnes } 5868965ea79SLois Curfman McInnes 5874a2ae208SSatish Balay #undef __FUNCT__ 5884a2ae208SSatish Balay #define __FUNCT__ "MatView_MPIDense" 589b0a32e0cSBarry Smith int MatView_MPIDense(Mat mat,PetscViewer viewer) 5908965ea79SLois Curfman McInnes { 59139ddd567SLois Curfman McInnes int ierr; 592f1af5d2fSBarry Smith PetscTruth isascii,isbinary,isdraw,issocket; 5938965ea79SLois Curfman McInnes 594433994e6SBarry Smith PetscFunctionBegin; 5950f5bd95cSBarry Smith 596b0a32e0cSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_ASCII,&isascii);CHKERRQ(ierr); 597fb9695e5SSatish Balay ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_BINARY,&isbinary);CHKERRQ(ierr); 598b0a32e0cSBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_SOCKET,&issocket);CHKERRQ(ierr); 599fb9695e5SSatish Balay ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_DRAW,&isdraw);CHKERRQ(ierr); 6000f5bd95cSBarry Smith 601f1af5d2fSBarry Smith if (isascii || issocket || isdraw) { 602f1af5d2fSBarry Smith ierr = MatView_MPIDense_ASCIIorDraworSocket(mat,viewer);CHKERRQ(ierr); 6030f5bd95cSBarry Smith } else if (isbinary) { 6043a40ed3dSBarry Smith ierr = MatView_MPIDense_Binary(mat,viewer);CHKERRQ(ierr); 6055cd90555SBarry Smith } else { 60629bbc08cSBarry Smith SETERRQ1(1,"Viewer type %s not supported by MPI dense matrix",((PetscObject)viewer)->type_name); 6078965ea79SLois Curfman McInnes } 6083a40ed3dSBarry Smith PetscFunctionReturn(0); 6098965ea79SLois Curfman McInnes } 6108965ea79SLois Curfman McInnes 6114a2ae208SSatish Balay #undef __FUNCT__ 6124a2ae208SSatish Balay #define __FUNCT__ "MatGetInfo_MPIDense" 6138f6be9afSLois Curfman McInnes int MatGetInfo_MPIDense(Mat A,MatInfoType flag,MatInfo *info) 6148965ea79SLois Curfman McInnes { 6153501a2bdSLois Curfman McInnes Mat_MPIDense *mat = (Mat_MPIDense*)A->data; 6163501a2bdSLois Curfman McInnes Mat mdn = mat->A; 6174e220ebcSLois Curfman McInnes int ierr; 618329f5518SBarry Smith PetscReal isend[5],irecv[5]; 6198965ea79SLois Curfman McInnes 6203a40ed3dSBarry Smith PetscFunctionBegin; 621273d9f13SBarry Smith info->rows_global = (double)A->M; 622273d9f13SBarry Smith info->columns_global = (double)A->N; 623273d9f13SBarry Smith info->rows_local = (double)A->m; 624273d9f13SBarry Smith info->columns_local = (double)A->N; 6254e220ebcSLois Curfman McInnes info->block_size = 1.0; 6264e220ebcSLois Curfman McInnes ierr = MatGetInfo(mdn,MAT_LOCAL,info);CHKERRQ(ierr); 6274e220ebcSLois Curfman McInnes isend[0] = info->nz_used; isend[1] = info->nz_allocated; isend[2] = info->nz_unneeded; 6284e220ebcSLois Curfman McInnes isend[3] = info->memory; isend[4] = info->mallocs; 6298965ea79SLois Curfman McInnes if (flag == MAT_LOCAL) { 6304e220ebcSLois Curfman McInnes info->nz_used = isend[0]; 6314e220ebcSLois Curfman McInnes info->nz_allocated = isend[1]; 6324e220ebcSLois Curfman McInnes info->nz_unneeded = isend[2]; 6334e220ebcSLois Curfman McInnes info->memory = isend[3]; 6344e220ebcSLois Curfman McInnes info->mallocs = isend[4]; 6358965ea79SLois Curfman McInnes } else if (flag == MAT_GLOBAL_MAX) { 636d7d1e502SBarry Smith ierr = MPI_Allreduce(isend,irecv,5,MPIU_REAL,MPI_MAX,A->comm);CHKERRQ(ierr); 6374e220ebcSLois Curfman McInnes info->nz_used = irecv[0]; 6384e220ebcSLois Curfman McInnes info->nz_allocated = irecv[1]; 6394e220ebcSLois Curfman McInnes info->nz_unneeded = irecv[2]; 6404e220ebcSLois Curfman McInnes info->memory = irecv[3]; 6414e220ebcSLois Curfman McInnes info->mallocs = irecv[4]; 6428965ea79SLois Curfman McInnes } else if (flag == MAT_GLOBAL_SUM) { 643d7d1e502SBarry Smith ierr = MPI_Allreduce(isend,irecv,5,MPIU_REAL,MPI_SUM,A->comm);CHKERRQ(ierr); 6444e220ebcSLois Curfman McInnes info->nz_used = irecv[0]; 6454e220ebcSLois Curfman McInnes info->nz_allocated = irecv[1]; 6464e220ebcSLois Curfman McInnes info->nz_unneeded = irecv[2]; 6474e220ebcSLois Curfman McInnes info->memory = irecv[3]; 6484e220ebcSLois Curfman McInnes info->mallocs = irecv[4]; 6498965ea79SLois Curfman McInnes } 6504e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; /* no parallel LU/ILU/Cholesky */ 6514e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 6524e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 6533a40ed3dSBarry Smith PetscFunctionReturn(0); 6548965ea79SLois Curfman McInnes } 6558965ea79SLois Curfman McInnes 6564a2ae208SSatish Balay #undef __FUNCT__ 6574a2ae208SSatish Balay #define __FUNCT__ "MatSetOption_MPIDense" 6588f6be9afSLois Curfman McInnes int MatSetOption_MPIDense(Mat A,MatOption op) 6598965ea79SLois Curfman McInnes { 66039ddd567SLois Curfman McInnes Mat_MPIDense *a = (Mat_MPIDense*)A->data; 661273d9f13SBarry Smith int ierr; 6628965ea79SLois Curfman McInnes 6633a40ed3dSBarry Smith PetscFunctionBegin; 66412c028f9SKris Buschelman switch (op) { 66512c028f9SKris Buschelman case MAT_NO_NEW_NONZERO_LOCATIONS: 66612c028f9SKris Buschelman case MAT_YES_NEW_NONZERO_LOCATIONS: 66712c028f9SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 66812c028f9SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 66912c028f9SKris Buschelman case MAT_COLUMNS_SORTED: 67012c028f9SKris Buschelman case MAT_COLUMNS_UNSORTED: 671273d9f13SBarry Smith ierr = MatSetOption(a->A,op);CHKERRQ(ierr); 67212c028f9SKris Buschelman break; 67312c028f9SKris Buschelman case MAT_ROW_ORIENTED: 674273d9f13SBarry Smith a->roworiented = PETSC_TRUE; 675273d9f13SBarry Smith ierr = MatSetOption(a->A,op);CHKERRQ(ierr); 67612c028f9SKris Buschelman break; 67712c028f9SKris Buschelman case MAT_ROWS_SORTED: 67812c028f9SKris Buschelman case MAT_ROWS_UNSORTED: 67912c028f9SKris Buschelman case MAT_YES_NEW_DIAGONALS: 68012c028f9SKris Buschelman case MAT_USE_HASH_TABLE: 681b0a32e0cSBarry Smith PetscLogInfo(A,"MatSetOption_MPIDense:Option ignored\n"); 68212c028f9SKris Buschelman break; 68312c028f9SKris Buschelman case MAT_COLUMN_ORIENTED: 684273d9f13SBarry Smith a->roworiented = PETSC_FALSE; 685273d9f13SBarry Smith ierr = MatSetOption(a->A,op);CHKERRQ(ierr); 68612c028f9SKris Buschelman break; 68712c028f9SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 688273d9f13SBarry Smith a->donotstash = PETSC_TRUE; 68912c028f9SKris Buschelman break; 69012c028f9SKris Buschelman case MAT_NO_NEW_DIAGONALS: 69129bbc08cSBarry Smith SETERRQ(PETSC_ERR_SUP,"MAT_NO_NEW_DIAGONALS"); 69277e54ba9SKris Buschelman case MAT_SYMMETRIC: 69377e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 6949a4540c5SBarry Smith case MAT_NOT_SYMMETRIC: 6959a4540c5SBarry Smith case MAT_NOT_STRUCTURALLY_SYMMETRIC: 6969a4540c5SBarry Smith case MAT_HERMITIAN: 6979a4540c5SBarry Smith case MAT_NOT_HERMITIAN: 6989a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 6999a4540c5SBarry Smith case MAT_NOT_SYMMETRY_ETERNAL: 70077e54ba9SKris Buschelman break; 70112c028f9SKris Buschelman default: 70229bbc08cSBarry Smith SETERRQ(PETSC_ERR_SUP,"unknown option"); 7033a40ed3dSBarry Smith } 7043a40ed3dSBarry Smith PetscFunctionReturn(0); 7058965ea79SLois Curfman McInnes } 7068965ea79SLois Curfman McInnes 7074a2ae208SSatish Balay #undef __FUNCT__ 7084a2ae208SSatish Balay #define __FUNCT__ "MatGetRow_MPIDense" 70987828ca2SBarry Smith int MatGetRow_MPIDense(Mat A,int row,int *nz,int **idx,PetscScalar **v) 7108965ea79SLois Curfman McInnes { 7113501a2bdSLois Curfman McInnes Mat_MPIDense *mat = (Mat_MPIDense*)A->data; 7123a40ed3dSBarry Smith int lrow,rstart = mat->rstart,rend = mat->rend,ierr; 7138965ea79SLois Curfman McInnes 7143a40ed3dSBarry Smith PetscFunctionBegin; 71529bbc08cSBarry Smith if (row < rstart || row >= rend) SETERRQ(PETSC_ERR_SUP,"only local rows") 7168965ea79SLois Curfman McInnes lrow = row - rstart; 7173a40ed3dSBarry Smith ierr = MatGetRow(mat->A,lrow,nz,idx,v);CHKERRQ(ierr); 7183a40ed3dSBarry Smith PetscFunctionReturn(0); 7198965ea79SLois Curfman McInnes } 7208965ea79SLois Curfman McInnes 7214a2ae208SSatish Balay #undef __FUNCT__ 7224a2ae208SSatish Balay #define __FUNCT__ "MatRestoreRow_MPIDense" 72387828ca2SBarry Smith int MatRestoreRow_MPIDense(Mat mat,int row,int *nz,int **idx,PetscScalar **v) 7248965ea79SLois Curfman McInnes { 725606d414cSSatish Balay int ierr; 726606d414cSSatish Balay 7273a40ed3dSBarry Smith PetscFunctionBegin; 728606d414cSSatish Balay if (idx) {ierr = PetscFree(*idx);CHKERRQ(ierr);} 729606d414cSSatish Balay if (v) {ierr = PetscFree(*v);CHKERRQ(ierr);} 7303a40ed3dSBarry Smith PetscFunctionReturn(0); 7318965ea79SLois Curfman McInnes } 7328965ea79SLois Curfman McInnes 7334a2ae208SSatish Balay #undef __FUNCT__ 7344a2ae208SSatish Balay #define __FUNCT__ "MatDiagonalScale_MPIDense" 7355b2fa520SLois Curfman McInnes int MatDiagonalScale_MPIDense(Mat A,Vec ll,Vec rr) 7365b2fa520SLois Curfman McInnes { 7375b2fa520SLois Curfman McInnes Mat_MPIDense *mdn = (Mat_MPIDense*)A->data; 7385b2fa520SLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)mdn->A->data; 73987828ca2SBarry Smith PetscScalar *l,*r,x,*v; 740273d9f13SBarry Smith int ierr,i,j,s2a,s3a,s2,s3,m=mdn->A->m,n=mdn->A->n; 7415b2fa520SLois Curfman McInnes 7425b2fa520SLois Curfman McInnes PetscFunctionBegin; 74372d926a5SLois Curfman McInnes ierr = MatGetLocalSize(A,&s2,&s3);CHKERRQ(ierr); 7445b2fa520SLois Curfman McInnes if (ll) { 74572d926a5SLois Curfman McInnes ierr = VecGetLocalSize(ll,&s2a);CHKERRQ(ierr); 74629bbc08cSBarry Smith if (s2a != s2) SETERRQ(PETSC_ERR_ARG_SIZ,"Left scaling vector non-conforming local size"); 747b1d4fb26SBarry Smith ierr = VecGetArrayFast(ll,&l);CHKERRQ(ierr); 7485b2fa520SLois Curfman McInnes for (i=0; i<m; i++) { 7495b2fa520SLois Curfman McInnes x = l[i]; 7505b2fa520SLois Curfman McInnes v = mat->v + i; 7515b2fa520SLois Curfman McInnes for (j=0; j<n; j++) { (*v) *= x; v+= m;} 7525b2fa520SLois Curfman McInnes } 753b1d4fb26SBarry Smith ierr = VecRestoreArrayFast(ll,&l);CHKERRQ(ierr); 754b0a32e0cSBarry Smith PetscLogFlops(n*m); 7555b2fa520SLois Curfman McInnes } 7565b2fa520SLois Curfman McInnes if (rr) { 75772d926a5SLois Curfman McInnes ierr = VecGetSize(rr,&s3a);CHKERRQ(ierr); 75829bbc08cSBarry Smith if (s3a != s3) SETERRQ(PETSC_ERR_ARG_SIZ,"Right scaling vec non-conforming local size"); 7595b2fa520SLois Curfman McInnes ierr = VecScatterBegin(rr,mdn->lvec,INSERT_VALUES,SCATTER_FORWARD,mdn->Mvctx);CHKERRQ(ierr); 7605b2fa520SLois Curfman McInnes ierr = VecScatterEnd(rr,mdn->lvec,INSERT_VALUES,SCATTER_FORWARD,mdn->Mvctx);CHKERRQ(ierr); 761b1d4fb26SBarry Smith ierr = VecGetArrayFast(mdn->lvec,&r);CHKERRQ(ierr); 7625b2fa520SLois Curfman McInnes for (i=0; i<n; i++) { 7635b2fa520SLois Curfman McInnes x = r[i]; 7645b2fa520SLois Curfman McInnes v = mat->v + i*m; 7655b2fa520SLois Curfman McInnes for (j=0; j<m; j++) { (*v++) *= x;} 7665b2fa520SLois Curfman McInnes } 767b1d4fb26SBarry Smith ierr = VecRestoreArrayFast(mdn->lvec,&r);CHKERRQ(ierr); 768b0a32e0cSBarry Smith PetscLogFlops(n*m); 7695b2fa520SLois Curfman McInnes } 7705b2fa520SLois Curfman McInnes PetscFunctionReturn(0); 7715b2fa520SLois Curfman McInnes } 7725b2fa520SLois Curfman McInnes 7734a2ae208SSatish Balay #undef __FUNCT__ 7744a2ae208SSatish Balay #define __FUNCT__ "MatNorm_MPIDense" 775064f8208SBarry Smith int MatNorm_MPIDense(Mat A,NormType type,PetscReal *nrm) 776096963f5SLois Curfman McInnes { 7773501a2bdSLois Curfman McInnes Mat_MPIDense *mdn = (Mat_MPIDense*)A->data; 7783501a2bdSLois Curfman McInnes Mat_SeqDense *mat = (Mat_SeqDense*)mdn->A->data; 7793501a2bdSLois Curfman McInnes int ierr,i,j; 780329f5518SBarry Smith PetscReal sum = 0.0; 78187828ca2SBarry Smith PetscScalar *v = mat->v; 7823501a2bdSLois Curfman McInnes 7833a40ed3dSBarry Smith PetscFunctionBegin; 7843501a2bdSLois Curfman McInnes if (mdn->size == 1) { 785064f8208SBarry Smith ierr = MatNorm(mdn->A,type,nrm);CHKERRQ(ierr); 7863501a2bdSLois Curfman McInnes } else { 7873501a2bdSLois Curfman McInnes if (type == NORM_FROBENIUS) { 788273d9f13SBarry Smith for (i=0; i<mdn->A->n*mdn->A->m; i++) { 789aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 790329f5518SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 7913501a2bdSLois Curfman McInnes #else 7923501a2bdSLois Curfman McInnes sum += (*v)*(*v); v++; 7933501a2bdSLois Curfman McInnes #endif 7943501a2bdSLois Curfman McInnes } 795064f8208SBarry Smith ierr = MPI_Allreduce(&sum,nrm,1,MPIU_REAL,MPI_SUM,A->comm);CHKERRQ(ierr); 796064f8208SBarry Smith *nrm = sqrt(*nrm); 797b0a32e0cSBarry Smith PetscLogFlops(2*mdn->A->n*mdn->A->m); 7983a40ed3dSBarry Smith } else if (type == NORM_1) { 799329f5518SBarry Smith PetscReal *tmp,*tmp2; 800b0a32e0cSBarry Smith ierr = PetscMalloc(2*A->N*sizeof(PetscReal),&tmp);CHKERRQ(ierr); 801273d9f13SBarry Smith tmp2 = tmp + A->N; 802273d9f13SBarry Smith ierr = PetscMemzero(tmp,2*A->N*sizeof(PetscReal));CHKERRQ(ierr); 803064f8208SBarry Smith *nrm = 0.0; 8043501a2bdSLois Curfman McInnes v = mat->v; 805273d9f13SBarry Smith for (j=0; j<mdn->A->n; j++) { 806273d9f13SBarry Smith for (i=0; i<mdn->A->m; i++) { 80767e560aaSBarry Smith tmp[j] += PetscAbsScalar(*v); v++; 8083501a2bdSLois Curfman McInnes } 8093501a2bdSLois Curfman McInnes } 810d7d1e502SBarry Smith ierr = MPI_Allreduce(tmp,tmp2,A->N,MPIU_REAL,MPI_SUM,A->comm);CHKERRQ(ierr); 811273d9f13SBarry Smith for (j=0; j<A->N; j++) { 812064f8208SBarry Smith if (tmp2[j] > *nrm) *nrm = tmp2[j]; 8133501a2bdSLois Curfman McInnes } 814606d414cSSatish Balay ierr = PetscFree(tmp);CHKERRQ(ierr); 815b0a32e0cSBarry Smith PetscLogFlops(A->n*A->m); 8163a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { /* max row norm */ 817329f5518SBarry Smith PetscReal ntemp; 8183501a2bdSLois Curfman McInnes ierr = MatNorm(mdn->A,type,&ntemp);CHKERRQ(ierr); 819064f8208SBarry Smith ierr = MPI_Allreduce(&ntemp,nrm,1,MPIU_REAL,MPI_MAX,A->comm);CHKERRQ(ierr); 8203a40ed3dSBarry Smith } else { 82129bbc08cSBarry Smith SETERRQ(PETSC_ERR_SUP,"No support for two norm"); 8223501a2bdSLois Curfman McInnes } 8233501a2bdSLois Curfman McInnes } 8243a40ed3dSBarry Smith PetscFunctionReturn(0); 8253501a2bdSLois Curfman McInnes } 8263501a2bdSLois Curfman McInnes 8274a2ae208SSatish Balay #undef __FUNCT__ 8284a2ae208SSatish Balay #define __FUNCT__ "MatTranspose_MPIDense" 8298f6be9afSLois Curfman McInnes int MatTranspose_MPIDense(Mat A,Mat *matout) 8303501a2bdSLois Curfman McInnes { 8313501a2bdSLois Curfman McInnes Mat_MPIDense *a = (Mat_MPIDense*)A->data; 8323501a2bdSLois Curfman McInnes Mat_SeqDense *Aloc = (Mat_SeqDense*)a->A->data; 8333501a2bdSLois Curfman McInnes Mat B; 834273d9f13SBarry Smith int M = A->M,N = A->N,m,n,*rwork,rstart = a->rstart; 8353501a2bdSLois Curfman McInnes int j,i,ierr; 83687828ca2SBarry Smith PetscScalar *v; 8373501a2bdSLois Curfman McInnes 8383a40ed3dSBarry Smith PetscFunctionBegin; 8397c922b88SBarry Smith if (!matout && M != N) { 84029bbc08cSBarry Smith SETERRQ(PETSC_ERR_SUP,"Supports square matrix only in-place"); 8417056b6fcSBarry Smith } 842878740d9SKris Buschelman ierr = MatCreate(A->comm,PETSC_DECIDE,PETSC_DECIDE,N,M,&B);CHKERRQ(ierr); 843878740d9SKris Buschelman ierr = MatSetType(B,A->type_name);CHKERRQ(ierr); 844878740d9SKris Buschelman ierr = MatMPIDenseSetPreallocation(B,PETSC_NULL);CHKERRQ(ierr); 8453501a2bdSLois Curfman McInnes 846273d9f13SBarry Smith m = a->A->m; n = a->A->n; v = Aloc->v; 847b0a32e0cSBarry Smith ierr = PetscMalloc(n*sizeof(int),&rwork);CHKERRQ(ierr); 8483501a2bdSLois Curfman McInnes for (j=0; j<n; j++) { 8493501a2bdSLois Curfman McInnes for (i=0; i<m; i++) rwork[i] = rstart + i; 8503501a2bdSLois Curfman McInnes ierr = MatSetValues(B,1,&j,m,rwork,v,INSERT_VALUES);CHKERRQ(ierr); 8513501a2bdSLois Curfman McInnes v += m; 8523501a2bdSLois Curfman McInnes } 853606d414cSSatish Balay ierr = PetscFree(rwork);CHKERRQ(ierr); 8546d4a8577SBarry Smith ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 8556d4a8577SBarry Smith ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 8567c922b88SBarry Smith if (matout) { 8573501a2bdSLois Curfman McInnes *matout = B; 8583501a2bdSLois Curfman McInnes } else { 859273d9f13SBarry Smith ierr = MatHeaderCopy(A,B);CHKERRQ(ierr); 8603501a2bdSLois Curfman McInnes } 8613a40ed3dSBarry Smith PetscFunctionReturn(0); 862096963f5SLois Curfman McInnes } 863096963f5SLois Curfman McInnes 864d9eff348SSatish Balay #include "petscblaslapack.h" 8654a2ae208SSatish Balay #undef __FUNCT__ 8664a2ae208SSatish Balay #define __FUNCT__ "MatScale_MPIDense" 867268466fbSBarry Smith int MatScale_MPIDense(const PetscScalar *alpha,Mat inA) 86844cd7ae7SLois Curfman McInnes { 86944cd7ae7SLois Curfman McInnes Mat_MPIDense *A = (Mat_MPIDense*)inA->data; 87044cd7ae7SLois Curfman McInnes Mat_SeqDense *a = (Mat_SeqDense*)A->A->data; 87144cd7ae7SLois Curfman McInnes int one = 1,nz; 87244cd7ae7SLois Curfman McInnes 8733a40ed3dSBarry Smith PetscFunctionBegin; 874273d9f13SBarry Smith nz = inA->m*inA->N; 875268466fbSBarry Smith BLscal_(&nz,(PetscScalar*)alpha,a->v,&one); 876b0a32e0cSBarry Smith PetscLogFlops(nz); 8773a40ed3dSBarry Smith PetscFunctionReturn(0); 87844cd7ae7SLois Curfman McInnes } 87944cd7ae7SLois Curfman McInnes 8805609ef8eSBarry Smith static int MatDuplicate_MPIDense(Mat,MatDuplicateOption,Mat *); 8818965ea79SLois Curfman McInnes 8824a2ae208SSatish Balay #undef __FUNCT__ 8834a2ae208SSatish Balay #define __FUNCT__ "MatSetUpPreallocation_MPIDense" 884273d9f13SBarry Smith int MatSetUpPreallocation_MPIDense(Mat A) 885273d9f13SBarry Smith { 886273d9f13SBarry Smith int ierr; 887273d9f13SBarry Smith 888273d9f13SBarry Smith PetscFunctionBegin; 889273d9f13SBarry Smith ierr = MatMPIDenseSetPreallocation(A,0);CHKERRQ(ierr); 890273d9f13SBarry Smith PetscFunctionReturn(0); 891273d9f13SBarry Smith } 892273d9f13SBarry Smith 8938965ea79SLois Curfman McInnes /* -------------------------------------------------------------------*/ 89409dc0095SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_MPIDense, 89509dc0095SBarry Smith MatGetRow_MPIDense, 89609dc0095SBarry Smith MatRestoreRow_MPIDense, 89709dc0095SBarry Smith MatMult_MPIDense, 89897304618SKris Buschelman /* 4*/ MatMultAdd_MPIDense, 8997c922b88SBarry Smith MatMultTranspose_MPIDense, 9007c922b88SBarry Smith MatMultTransposeAdd_MPIDense, 9018965ea79SLois Curfman McInnes 0, 90209dc0095SBarry Smith 0, 90309dc0095SBarry Smith 0, 90497304618SKris Buschelman /*10*/ 0, 90509dc0095SBarry Smith 0, 90609dc0095SBarry Smith 0, 90709dc0095SBarry Smith 0, 90809dc0095SBarry Smith MatTranspose_MPIDense, 90997304618SKris Buschelman /*15*/ MatGetInfo_MPIDense, 91097304618SKris Buschelman 0, 91109dc0095SBarry Smith MatGetDiagonal_MPIDense, 9125b2fa520SLois Curfman McInnes MatDiagonalScale_MPIDense, 91309dc0095SBarry Smith MatNorm_MPIDense, 91497304618SKris Buschelman /*20*/ MatAssemblyBegin_MPIDense, 91509dc0095SBarry Smith MatAssemblyEnd_MPIDense, 91609dc0095SBarry Smith 0, 91709dc0095SBarry Smith MatSetOption_MPIDense, 91809dc0095SBarry Smith MatZeroEntries_MPIDense, 91997304618SKris Buschelman /*25*/ MatZeroRows_MPIDense, 92009dc0095SBarry Smith 0, 92109dc0095SBarry Smith 0, 92209dc0095SBarry Smith 0, 92309dc0095SBarry Smith 0, 92497304618SKris Buschelman /*30*/ MatSetUpPreallocation_MPIDense, 925273d9f13SBarry Smith 0, 92609dc0095SBarry Smith 0, 92709dc0095SBarry Smith MatGetArray_MPIDense, 92809dc0095SBarry Smith MatRestoreArray_MPIDense, 92997304618SKris Buschelman /*35*/ MatDuplicate_MPIDense, 93009dc0095SBarry Smith 0, 93109dc0095SBarry Smith 0, 93209dc0095SBarry Smith 0, 93309dc0095SBarry Smith 0, 93497304618SKris Buschelman /*40*/ 0, 9352ce60cd0SSatish Balay MatGetSubMatrices_MPIDense, 93609dc0095SBarry Smith 0, 93709dc0095SBarry Smith MatGetValues_MPIDense, 93809dc0095SBarry Smith 0, 93997304618SKris Buschelman /*45*/ 0, 94009dc0095SBarry Smith MatScale_MPIDense, 94109dc0095SBarry Smith 0, 94209dc0095SBarry Smith 0, 94309dc0095SBarry Smith 0, 94497304618SKris Buschelman /*50*/ MatGetBlockSize_MPIDense, 94509dc0095SBarry Smith 0, 94609dc0095SBarry Smith 0, 94709dc0095SBarry Smith 0, 94809dc0095SBarry Smith 0, 94997304618SKris Buschelman /*55*/ 0, 95009dc0095SBarry Smith 0, 95109dc0095SBarry Smith 0, 95209dc0095SBarry Smith 0, 95309dc0095SBarry Smith 0, 95497304618SKris Buschelman /*60*/ MatGetSubMatrix_MPIDense, 955b9b97703SBarry Smith MatDestroy_MPIDense, 956b9b97703SBarry Smith MatView_MPIDense, 95797304618SKris Buschelman MatGetPetscMaps_Petsc, 95897304618SKris Buschelman 0, 95997304618SKris Buschelman /*65*/ 0, 96097304618SKris Buschelman 0, 96197304618SKris Buschelman 0, 96297304618SKris Buschelman 0, 96397304618SKris Buschelman 0, 96497304618SKris Buschelman /*70*/ 0, 96597304618SKris Buschelman 0, 96697304618SKris Buschelman 0, 96797304618SKris Buschelman 0, 96897304618SKris Buschelman 0, 96997304618SKris Buschelman /*75*/ 0, 97097304618SKris Buschelman 0, 97197304618SKris Buschelman 0, 97297304618SKris Buschelman 0, 97397304618SKris Buschelman 0, 97497304618SKris Buschelman /*80*/ 0, 97597304618SKris Buschelman 0, 97697304618SKris Buschelman 0, 97797304618SKris Buschelman 0, 97897304618SKris Buschelman /*85*/ MatLoad_MPIDense}; 9798965ea79SLois Curfman McInnes 980273d9f13SBarry Smith EXTERN_C_BEGIN 9814a2ae208SSatish Balay #undef __FUNCT__ 982a23d5eceSKris Buschelman #define __FUNCT__ "MatMPIDenseSetPreallocation_MPIDense" 983a23d5eceSKris Buschelman int MatMPIDenseSetPreallocation_MPIDense(Mat mat,PetscScalar *data) 984a23d5eceSKris Buschelman { 985a23d5eceSKris Buschelman Mat_MPIDense *a; 986a23d5eceSKris Buschelman int ierr; 987a23d5eceSKris Buschelman 988a23d5eceSKris Buschelman PetscFunctionBegin; 989a23d5eceSKris Buschelman mat->preallocated = PETSC_TRUE; 990a23d5eceSKris Buschelman /* Note: For now, when data is specified above, this assumes the user correctly 991a23d5eceSKris Buschelman allocates the local dense storage space. We should add error checking. */ 992a23d5eceSKris Buschelman 993a23d5eceSKris Buschelman a = (Mat_MPIDense*)mat->data; 9945c5985e7SKris Buschelman ierr = MatCreate(PETSC_COMM_SELF,mat->m,mat->N,mat->m,mat->N,&a->A);CHKERRQ(ierr); 9955c5985e7SKris Buschelman ierr = MatSetType(a->A,MATSEQDENSE);CHKERRQ(ierr); 9965c5985e7SKris Buschelman ierr = MatSeqDenseSetPreallocation(a->A,data);CHKERRQ(ierr); 997a23d5eceSKris Buschelman PetscLogObjectParent(mat,a->A); 998a23d5eceSKris Buschelman PetscFunctionReturn(0); 999a23d5eceSKris Buschelman } 1000a23d5eceSKris Buschelman EXTERN_C_END 1001a23d5eceSKris Buschelman 10020bad9183SKris Buschelman /*MC 1003fafad747SKris Buschelman MATMPIDENSE - MATMPIDENSE = "mpidense" - A matrix type to be used for distributed dense matrices. 10040bad9183SKris Buschelman 10050bad9183SKris Buschelman Options Database Keys: 10060bad9183SKris Buschelman . -mat_type mpidense - sets the matrix type to "mpidense" during a call to MatSetFromOptions() 10070bad9183SKris Buschelman 10080bad9183SKris Buschelman Level: beginner 10090bad9183SKris Buschelman 10100bad9183SKris Buschelman .seealso: MatCreateMPIDense 10110bad9183SKris Buschelman M*/ 10120bad9183SKris Buschelman 1013a23d5eceSKris Buschelman EXTERN_C_BEGIN 1014a23d5eceSKris Buschelman #undef __FUNCT__ 10154a2ae208SSatish Balay #define __FUNCT__ "MatCreate_MPIDense" 1016273d9f13SBarry Smith int MatCreate_MPIDense(Mat mat) 1017273d9f13SBarry Smith { 1018273d9f13SBarry Smith Mat_MPIDense *a; 1019273d9f13SBarry Smith int ierr,i; 1020273d9f13SBarry Smith 1021273d9f13SBarry Smith PetscFunctionBegin; 1022b0a32e0cSBarry Smith ierr = PetscNew(Mat_MPIDense,&a);CHKERRQ(ierr); 1023b0a32e0cSBarry Smith mat->data = (void*)a; 1024273d9f13SBarry Smith ierr = PetscMemcpy(mat->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 1025273d9f13SBarry Smith mat->factor = 0; 1026273d9f13SBarry Smith mat->mapping = 0; 1027273d9f13SBarry Smith 1028273d9f13SBarry Smith a->factor = 0; 1029273d9f13SBarry Smith mat->insertmode = NOT_SET_VALUES; 1030273d9f13SBarry Smith ierr = MPI_Comm_rank(mat->comm,&a->rank);CHKERRQ(ierr); 1031273d9f13SBarry Smith ierr = MPI_Comm_size(mat->comm,&a->size);CHKERRQ(ierr); 1032273d9f13SBarry Smith 1033273d9f13SBarry Smith ierr = PetscSplitOwnership(mat->comm,&mat->m,&mat->M);CHKERRQ(ierr); 1034273d9f13SBarry Smith ierr = PetscSplitOwnership(mat->comm,&mat->n,&mat->N);CHKERRQ(ierr); 1035273d9f13SBarry Smith a->nvec = mat->n; 1036273d9f13SBarry Smith 1037273d9f13SBarry Smith /* the information in the maps duplicates the information computed below, eventually 1038273d9f13SBarry Smith we should remove the duplicate information that is not contained in the maps */ 10398a124369SBarry Smith ierr = PetscMapCreateMPI(mat->comm,mat->m,mat->M,&mat->rmap);CHKERRQ(ierr); 10408a124369SBarry Smith ierr = PetscMapCreateMPI(mat->comm,mat->n,mat->N,&mat->cmap);CHKERRQ(ierr); 1041273d9f13SBarry Smith 1042273d9f13SBarry Smith /* build local table of row and column ownerships */ 1043b0a32e0cSBarry Smith ierr = PetscMalloc(2*(a->size+2)*sizeof(int),&a->rowners);CHKERRQ(ierr); 1044273d9f13SBarry Smith a->cowners = a->rowners + a->size + 1; 1045b0a32e0cSBarry Smith PetscLogObjectMemory(mat,2*(a->size+2)*sizeof(int)+sizeof(struct _p_Mat)+sizeof(Mat_MPIDense)); 1046273d9f13SBarry Smith ierr = MPI_Allgather(&mat->m,1,MPI_INT,a->rowners+1,1,MPI_INT,mat->comm);CHKERRQ(ierr); 1047273d9f13SBarry Smith a->rowners[0] = 0; 1048273d9f13SBarry Smith for (i=2; i<=a->size; i++) { 1049273d9f13SBarry Smith a->rowners[i] += a->rowners[i-1]; 1050273d9f13SBarry Smith } 1051273d9f13SBarry Smith a->rstart = a->rowners[a->rank]; 1052273d9f13SBarry Smith a->rend = a->rowners[a->rank+1]; 1053273d9f13SBarry Smith ierr = MPI_Allgather(&mat->n,1,MPI_INT,a->cowners+1,1,MPI_INT,mat->comm);CHKERRQ(ierr); 1054273d9f13SBarry Smith a->cowners[0] = 0; 1055273d9f13SBarry Smith for (i=2; i<=a->size; i++) { 1056273d9f13SBarry Smith a->cowners[i] += a->cowners[i-1]; 1057273d9f13SBarry Smith } 1058273d9f13SBarry Smith 1059273d9f13SBarry Smith /* build cache for off array entries formed */ 1060273d9f13SBarry Smith a->donotstash = PETSC_FALSE; 1061273d9f13SBarry Smith ierr = MatStashCreate_Private(mat->comm,1,&mat->stash);CHKERRQ(ierr); 1062273d9f13SBarry Smith 1063273d9f13SBarry Smith /* stuff used for matrix vector multiply */ 1064273d9f13SBarry Smith a->lvec = 0; 1065273d9f13SBarry Smith a->Mvctx = 0; 1066273d9f13SBarry Smith a->roworiented = PETSC_TRUE; 1067273d9f13SBarry Smith 1068273d9f13SBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)mat,"MatGetDiagonalBlock_C", 1069273d9f13SBarry Smith "MatGetDiagonalBlock_MPIDense", 1070273d9f13SBarry Smith MatGetDiagonalBlock_MPIDense);CHKERRQ(ierr); 1071a23d5eceSKris Buschelman ierr = PetscObjectComposeFunctionDynamic((PetscObject)mat,"MatMPIDenseSetPreallocation_C", 1072a23d5eceSKris Buschelman "MatMPIDenseSetPreallocation_MPIDense", 1073a23d5eceSKris Buschelman MatMPIDenseSetPreallocation_MPIDense);CHKERRQ(ierr); 1074273d9f13SBarry Smith PetscFunctionReturn(0); 1075273d9f13SBarry Smith } 1076273d9f13SBarry Smith EXTERN_C_END 1077273d9f13SBarry Smith 1078209238afSKris Buschelman /*MC 1079002d173eSKris Buschelman MATDENSE - MATDENSE = "dense" - A matrix type to be used for dense matrices. 1080209238afSKris Buschelman 1081209238afSKris Buschelman This matrix type is identical to MATSEQDENSE when constructed with a single process communicator, 1082209238afSKris Buschelman and MATMPIDENSE otherwise. 1083209238afSKris Buschelman 1084209238afSKris Buschelman Options Database Keys: 1085209238afSKris Buschelman . -mat_type dense - sets the matrix type to "dense" during a call to MatSetFromOptions() 1086209238afSKris Buschelman 1087209238afSKris Buschelman Level: beginner 1088209238afSKris Buschelman 1089209238afSKris Buschelman .seealso: MatCreateMPIDense,MATSEQDENSE,MATMPIDENSE 1090209238afSKris Buschelman M*/ 1091209238afSKris Buschelman 1092209238afSKris Buschelman EXTERN_C_BEGIN 1093209238afSKris Buschelman #undef __FUNCT__ 1094209238afSKris Buschelman #define __FUNCT__ "MatCreate_Dense" 1095209238afSKris Buschelman int MatCreate_Dense(Mat A) { 1096209238afSKris Buschelman int ierr,size; 1097209238afSKris Buschelman 1098209238afSKris Buschelman PetscFunctionBegin; 1099209238afSKris Buschelman ierr = PetscObjectChangeTypeName((PetscObject)A,MATDENSE);CHKERRQ(ierr); 1100209238afSKris Buschelman ierr = MPI_Comm_size(A->comm,&size);CHKERRQ(ierr); 1101209238afSKris Buschelman if (size == 1) { 1102209238afSKris Buschelman ierr = MatSetType(A,MATSEQDENSE);CHKERRQ(ierr); 1103209238afSKris Buschelman } else { 1104209238afSKris Buschelman ierr = MatSetType(A,MATMPIDENSE);CHKERRQ(ierr); 1105209238afSKris Buschelman } 1106209238afSKris Buschelman PetscFunctionReturn(0); 1107209238afSKris Buschelman } 1108209238afSKris Buschelman EXTERN_C_END 1109209238afSKris Buschelman 11104a2ae208SSatish Balay #undef __FUNCT__ 11114a2ae208SSatish Balay #define __FUNCT__ "MatMPIDenseSetPreallocation" 1112273d9f13SBarry Smith /*@C 1113273d9f13SBarry Smith MatMPIDenseSetPreallocation - Sets the array used to store the matrix entries 1114273d9f13SBarry Smith 1115273d9f13SBarry Smith Not collective 1116273d9f13SBarry Smith 1117273d9f13SBarry Smith Input Parameters: 1118273d9f13SBarry Smith . A - the matrix 1119273d9f13SBarry Smith - data - optional location of matrix data. Set data=PETSC_NULL for PETSc 1120273d9f13SBarry Smith to control all matrix memory allocation. 1121273d9f13SBarry Smith 1122273d9f13SBarry Smith Notes: 1123273d9f13SBarry Smith The dense format is fully compatible with standard Fortran 77 1124273d9f13SBarry Smith storage by columns. 1125273d9f13SBarry Smith 1126273d9f13SBarry Smith The data input variable is intended primarily for Fortran programmers 1127273d9f13SBarry Smith who wish to allocate their own matrix memory space. Most users should 1128273d9f13SBarry Smith set data=PETSC_NULL. 1129273d9f13SBarry Smith 1130273d9f13SBarry Smith Level: intermediate 1131273d9f13SBarry Smith 1132273d9f13SBarry Smith .keywords: matrix,dense, parallel 1133273d9f13SBarry Smith 1134273d9f13SBarry Smith .seealso: MatCreate(), MatCreateSeqDense(), MatSetValues() 1135273d9f13SBarry Smith @*/ 113687828ca2SBarry Smith int MatMPIDenseSetPreallocation(Mat mat,PetscScalar *data) 1137273d9f13SBarry Smith { 1138a23d5eceSKris Buschelman int ierr,(*f)(Mat,PetscScalar *); 1139273d9f13SBarry Smith 1140273d9f13SBarry Smith PetscFunctionBegin; 1141565567f0SKris Buschelman ierr = PetscObjectQueryFunction((PetscObject)mat,"MatMPIDenseSetPreallocation_C",(void (**)(void))&f);CHKERRQ(ierr); 1142a23d5eceSKris Buschelman if (f) { 1143a23d5eceSKris Buschelman ierr = (*f)(mat,data);CHKERRQ(ierr); 1144a23d5eceSKris Buschelman } 1145273d9f13SBarry Smith PetscFunctionReturn(0); 1146273d9f13SBarry Smith } 1147273d9f13SBarry Smith 11484a2ae208SSatish Balay #undef __FUNCT__ 11494a2ae208SSatish Balay #define __FUNCT__ "MatCreateMPIDense" 11508965ea79SLois Curfman McInnes /*@C 115139ddd567SLois Curfman McInnes MatCreateMPIDense - Creates a sparse parallel matrix in dense format. 11528965ea79SLois Curfman McInnes 1153db81eaa0SLois Curfman McInnes Collective on MPI_Comm 1154db81eaa0SLois Curfman McInnes 11558965ea79SLois Curfman McInnes Input Parameters: 1156db81eaa0SLois Curfman McInnes + comm - MPI communicator 11578965ea79SLois Curfman McInnes . m - number of local rows (or PETSC_DECIDE to have calculated if M is given) 1158db81eaa0SLois Curfman McInnes . n - number of local columns (or PETSC_DECIDE to have calculated if N is given) 11598965ea79SLois Curfman McInnes . M - number of global rows (or PETSC_DECIDE to have calculated if m is given) 1160db81eaa0SLois Curfman McInnes . N - number of global columns (or PETSC_DECIDE to have calculated if n is given) 11617f5ff6fdSBarry Smith - data - optional location of matrix data. Set data=PETSC_NULL (PETSC_NULL_SCALAR for Fortran users) for PETSc 1162dfc5480cSLois Curfman McInnes to control all matrix memory allocation. 11638965ea79SLois Curfman McInnes 11648965ea79SLois Curfman McInnes Output Parameter: 1165477f1c0bSLois Curfman McInnes . A - the matrix 11668965ea79SLois Curfman McInnes 1167b259b22eSLois Curfman McInnes Notes: 116839ddd567SLois Curfman McInnes The dense format is fully compatible with standard Fortran 77 116939ddd567SLois Curfman McInnes storage by columns. 11708965ea79SLois Curfman McInnes 117118f449edSLois Curfman McInnes The data input variable is intended primarily for Fortran programmers 117218f449edSLois Curfman McInnes who wish to allocate their own matrix memory space. Most users should 11737f5ff6fdSBarry Smith set data=PETSC_NULL (PETSC_NULL_SCALAR for Fortran users). 117418f449edSLois Curfman McInnes 11758965ea79SLois Curfman McInnes The user MUST specify either the local or global matrix dimensions 11768965ea79SLois Curfman McInnes (possibly both). 11778965ea79SLois Curfman McInnes 1178027ccd11SLois Curfman McInnes Level: intermediate 1179027ccd11SLois Curfman McInnes 118039ddd567SLois Curfman McInnes .keywords: matrix,dense, parallel 11818965ea79SLois Curfman McInnes 118239ddd567SLois Curfman McInnes .seealso: MatCreate(), MatCreateSeqDense(), MatSetValues() 11838965ea79SLois Curfman McInnes @*/ 118487828ca2SBarry Smith int MatCreateMPIDense(MPI_Comm comm,int m,int n,int M,int N,PetscScalar *data,Mat *A) 11858965ea79SLois Curfman McInnes { 1186273d9f13SBarry Smith int ierr,size; 11878965ea79SLois Curfman McInnes 11883a40ed3dSBarry Smith PetscFunctionBegin; 1189273d9f13SBarry Smith ierr = MatCreate(comm,m,n,M,N,A);CHKERRQ(ierr); 1190273d9f13SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 1191273d9f13SBarry Smith if (size > 1) { 1192273d9f13SBarry Smith ierr = MatSetType(*A,MATMPIDENSE);CHKERRQ(ierr); 1193273d9f13SBarry Smith ierr = MatMPIDenseSetPreallocation(*A,data);CHKERRQ(ierr); 1194273d9f13SBarry Smith } else { 1195273d9f13SBarry Smith ierr = MatSetType(*A,MATSEQDENSE);CHKERRQ(ierr); 1196273d9f13SBarry Smith ierr = MatSeqDenseSetPreallocation(*A,data);CHKERRQ(ierr); 11978c469469SLois Curfman McInnes } 11983a40ed3dSBarry Smith PetscFunctionReturn(0); 11998965ea79SLois Curfman McInnes } 12008965ea79SLois Curfman McInnes 12014a2ae208SSatish Balay #undef __FUNCT__ 12024a2ae208SSatish Balay #define __FUNCT__ "MatDuplicate_MPIDense" 12035609ef8eSBarry Smith static int MatDuplicate_MPIDense(Mat A,MatDuplicateOption cpvalues,Mat *newmat) 12048965ea79SLois Curfman McInnes { 12058965ea79SLois Curfman McInnes Mat mat; 12063501a2bdSLois Curfman McInnes Mat_MPIDense *a,*oldmat = (Mat_MPIDense*)A->data; 120739ddd567SLois Curfman McInnes int ierr; 12088965ea79SLois Curfman McInnes 12093a40ed3dSBarry Smith PetscFunctionBegin; 12108965ea79SLois Curfman McInnes *newmat = 0; 1211273d9f13SBarry Smith ierr = MatCreate(A->comm,A->m,A->n,A->M,A->N,&mat);CHKERRQ(ierr); 1212*be5d1d56SKris Buschelman ierr = MatSetType(mat,A->type_name);CHKERRQ(ierr); 1213b0a32e0cSBarry Smith ierr = PetscNew(Mat_MPIDense,&a);CHKERRQ(ierr); 1214b0a32e0cSBarry Smith mat->data = (void*)a; 1215549d3d68SSatish Balay ierr = PetscMemcpy(mat->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 12163501a2bdSLois Curfman McInnes mat->factor = A->factor; 1217c456f294SBarry Smith mat->assembled = PETSC_TRUE; 1218273d9f13SBarry Smith mat->preallocated = PETSC_TRUE; 12198965ea79SLois Curfman McInnes 12208965ea79SLois Curfman McInnes a->rstart = oldmat->rstart; 12218965ea79SLois Curfman McInnes a->rend = oldmat->rend; 12228965ea79SLois Curfman McInnes a->size = oldmat->size; 12238965ea79SLois Curfman McInnes a->rank = oldmat->rank; 1224e0fa3b82SLois Curfman McInnes mat->insertmode = NOT_SET_VALUES; 1225b9b97703SBarry Smith a->nvec = oldmat->nvec; 12263782ba37SSatish Balay a->donotstash = oldmat->donotstash; 1227b0a32e0cSBarry Smith ierr = PetscMalloc((a->size+1)*sizeof(int),&a->rowners);CHKERRQ(ierr); 1228b0a32e0cSBarry Smith PetscLogObjectMemory(mat,(a->size+1)*sizeof(int)+sizeof(struct _p_Mat)+sizeof(Mat_MPIDense)); 1229549d3d68SSatish Balay ierr = PetscMemcpy(a->rowners,oldmat->rowners,(a->size+1)*sizeof(int));CHKERRQ(ierr); 12308798bf22SSatish Balay ierr = MatStashCreate_Private(A->comm,1,&mat->stash);CHKERRQ(ierr); 12318965ea79SLois Curfman McInnes 1232329f5518SBarry Smith ierr = MatSetUpMultiply_MPIDense(mat);CHKERRQ(ierr); 12335609ef8eSBarry Smith ierr = MatDuplicate(oldmat->A,cpvalues,&a->A);CHKERRQ(ierr); 1234b0a32e0cSBarry Smith PetscLogObjectParent(mat,a->A); 12358965ea79SLois Curfman McInnes *newmat = mat; 12363a40ed3dSBarry Smith PetscFunctionReturn(0); 12378965ea79SLois Curfman McInnes } 12388965ea79SLois Curfman McInnes 1239e090d566SSatish Balay #include "petscsys.h" 12408965ea79SLois Curfman McInnes 12414a2ae208SSatish Balay #undef __FUNCT__ 12424a2ae208SSatish Balay #define __FUNCT__ "MatLoad_MPIDense_DenseInFile" 1243*be5d1d56SKris Buschelman int MatLoad_MPIDense_DenseInFile(MPI_Comm comm,int fd,int M,int N,const MatType type,Mat *newmat) 124490ace30eSBarry Smith { 124540011551SBarry Smith int *rowners,i,size,rank,m,ierr,nz,j; 124687828ca2SBarry Smith PetscScalar *array,*vals,*vals_ptr; 124790ace30eSBarry Smith MPI_Status status; 124890ace30eSBarry Smith 12493a40ed3dSBarry Smith PetscFunctionBegin; 1250d132466eSBarry Smith ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 1251d132466eSBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 125290ace30eSBarry Smith 125390ace30eSBarry Smith /* determine ownership of all rows */ 125490ace30eSBarry Smith m = M/size + ((M % size) > rank); 1255b0a32e0cSBarry Smith ierr = PetscMalloc((size+2)*sizeof(int),&rowners);CHKERRQ(ierr); 1256ca161407SBarry Smith ierr = MPI_Allgather(&m,1,MPI_INT,rowners+1,1,MPI_INT,comm);CHKERRQ(ierr); 125790ace30eSBarry Smith rowners[0] = 0; 125890ace30eSBarry Smith for (i=2; i<=size; i++) { 125990ace30eSBarry Smith rowners[i] += rowners[i-1]; 126090ace30eSBarry Smith } 126190ace30eSBarry Smith 1262878740d9SKris Buschelman ierr = MatCreate(comm,m,PETSC_DECIDE,M,N,newmat);CHKERRQ(ierr); 1263*be5d1d56SKris Buschelman ierr = MatSetType(*newmat,type);CHKERRQ(ierr); 1264878740d9SKris Buschelman ierr = MatMPIDenseSetPreallocation(*newmat,PETSC_NULL);CHKERRQ(ierr); 126590ace30eSBarry Smith ierr = MatGetArray(*newmat,&array);CHKERRQ(ierr); 126690ace30eSBarry Smith 126790ace30eSBarry Smith if (!rank) { 126887828ca2SBarry Smith ierr = PetscMalloc(m*N*sizeof(PetscScalar),&vals);CHKERRQ(ierr); 126990ace30eSBarry Smith 127090ace30eSBarry Smith /* read in my part of the matrix numerical values */ 12710752156aSBarry Smith ierr = PetscBinaryRead(fd,vals,m*N,PETSC_SCALAR);CHKERRQ(ierr); 127290ace30eSBarry Smith 127390ace30eSBarry Smith /* insert into matrix-by row (this is why cannot directly read into array */ 127490ace30eSBarry Smith vals_ptr = vals; 127590ace30eSBarry Smith for (i=0; i<m; i++) { 127690ace30eSBarry Smith for (j=0; j<N; j++) { 127790ace30eSBarry Smith array[i + j*m] = *vals_ptr++; 127890ace30eSBarry Smith } 127990ace30eSBarry Smith } 128090ace30eSBarry Smith 128190ace30eSBarry Smith /* read in other processors and ship out */ 128290ace30eSBarry Smith for (i=1; i<size; i++) { 128390ace30eSBarry Smith nz = (rowners[i+1] - rowners[i])*N; 12840752156aSBarry Smith ierr = PetscBinaryRead(fd,vals,nz,PETSC_SCALAR);CHKERRQ(ierr); 1285ca161407SBarry Smith ierr = MPI_Send(vals,nz,MPIU_SCALAR,i,(*newmat)->tag,comm);CHKERRQ(ierr); 128690ace30eSBarry Smith } 12873a40ed3dSBarry Smith } else { 128890ace30eSBarry Smith /* receive numeric values */ 128987828ca2SBarry Smith ierr = PetscMalloc(m*N*sizeof(PetscScalar),&vals);CHKERRQ(ierr); 129090ace30eSBarry Smith 129190ace30eSBarry Smith /* receive message of values*/ 1292ca161407SBarry Smith ierr = MPI_Recv(vals,m*N,MPIU_SCALAR,0,(*newmat)->tag,comm,&status);CHKERRQ(ierr); 129390ace30eSBarry Smith 129490ace30eSBarry Smith /* insert into matrix-by row (this is why cannot directly read into array */ 129590ace30eSBarry Smith vals_ptr = vals; 129690ace30eSBarry Smith for (i=0; i<m; i++) { 129790ace30eSBarry Smith for (j=0; j<N; j++) { 129890ace30eSBarry Smith array[i + j*m] = *vals_ptr++; 129990ace30eSBarry Smith } 130090ace30eSBarry Smith } 130190ace30eSBarry Smith } 1302606d414cSSatish Balay ierr = PetscFree(rowners);CHKERRQ(ierr); 1303606d414cSSatish Balay ierr = PetscFree(vals);CHKERRQ(ierr); 13046d4a8577SBarry Smith ierr = MatAssemblyBegin(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 13056d4a8577SBarry Smith ierr = MatAssemblyEnd(*newmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 13063a40ed3dSBarry Smith PetscFunctionReturn(0); 130790ace30eSBarry Smith } 130890ace30eSBarry Smith 13094a2ae208SSatish Balay #undef __FUNCT__ 13104a2ae208SSatish Balay #define __FUNCT__ "MatLoad_MPIDense" 13118e9aea5cSBarry Smith int MatLoad_MPIDense(PetscViewer viewer,const MatType type,Mat *newmat) 13128965ea79SLois Curfman McInnes { 13138965ea79SLois Curfman McInnes Mat A; 131487828ca2SBarry Smith PetscScalar *vals,*svals; 131519bcc07fSBarry Smith MPI_Comm comm = ((PetscObject)viewer)->comm; 13168965ea79SLois Curfman McInnes MPI_Status status; 13178965ea79SLois Curfman McInnes int header[4],rank,size,*rowlengths = 0,M,N,m,*rowners,maxnz,*cols; 13188965ea79SLois Curfman McInnes int *ourlens,*sndcounts = 0,*procsnz = 0,*offlens,jj,*mycols,*smycols; 131919bcc07fSBarry Smith int tag = ((PetscObject)viewer)->tag; 13203a40ed3dSBarry Smith int i,nz,ierr,j,rstart,rend,fd; 13218965ea79SLois Curfman McInnes 13223a40ed3dSBarry Smith PetscFunctionBegin; 1323d132466eSBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 1324d132466eSBarry Smith ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 13258965ea79SLois Curfman McInnes if (!rank) { 1326b0a32e0cSBarry Smith ierr = PetscViewerBinaryGetDescriptor(viewer,&fd);CHKERRQ(ierr); 13270752156aSBarry Smith ierr = PetscBinaryRead(fd,(char *)header,4,PETSC_INT);CHKERRQ(ierr); 1328552e946dSBarry Smith if (header[0] != MAT_FILE_COOKIE) SETERRQ(PETSC_ERR_FILE_UNEXPECTED,"not matrix object"); 13298965ea79SLois Curfman McInnes } 13308965ea79SLois Curfman McInnes 1331ca161407SBarry Smith ierr = MPI_Bcast(header+1,3,MPI_INT,0,comm);CHKERRQ(ierr); 133290ace30eSBarry Smith M = header[1]; N = header[2]; nz = header[3]; 133390ace30eSBarry Smith 133490ace30eSBarry Smith /* 133590ace30eSBarry Smith Handle case where matrix is stored on disk as a dense matrix 133690ace30eSBarry Smith */ 133790ace30eSBarry Smith if (nz == MATRIX_BINARY_FORMAT_DENSE) { 1338*be5d1d56SKris Buschelman ierr = MatLoad_MPIDense_DenseInFile(comm,fd,M,N,type,newmat);CHKERRQ(ierr); 13393a40ed3dSBarry Smith PetscFunctionReturn(0); 134090ace30eSBarry Smith } 134190ace30eSBarry Smith 13428965ea79SLois Curfman McInnes /* determine ownership of all rows */ 13438965ea79SLois Curfman McInnes m = M/size + ((M % size) > rank); 1344b0a32e0cSBarry Smith ierr = PetscMalloc((size+2)*sizeof(int),&rowners);CHKERRQ(ierr); 1345ca161407SBarry Smith ierr = MPI_Allgather(&m,1,MPI_INT,rowners+1,1,MPI_INT,comm);CHKERRQ(ierr); 13468965ea79SLois Curfman McInnes rowners[0] = 0; 13478965ea79SLois Curfman McInnes for (i=2; i<=size; i++) { 13488965ea79SLois Curfman McInnes rowners[i] += rowners[i-1]; 13498965ea79SLois Curfman McInnes } 13508965ea79SLois Curfman McInnes rstart = rowners[rank]; 13518965ea79SLois Curfman McInnes rend = rowners[rank+1]; 13528965ea79SLois Curfman McInnes 13538965ea79SLois Curfman McInnes /* distribute row lengths to all processors */ 1354b0a32e0cSBarry Smith ierr = PetscMalloc(2*(rend-rstart)*sizeof(int),&ourlens);CHKERRQ(ierr); 13558965ea79SLois Curfman McInnes offlens = ourlens + (rend-rstart); 13568965ea79SLois Curfman McInnes if (!rank) { 1357b0a32e0cSBarry Smith ierr = PetscMalloc(M*sizeof(int),&rowlengths);CHKERRQ(ierr); 13580752156aSBarry Smith ierr = PetscBinaryRead(fd,rowlengths,M,PETSC_INT);CHKERRQ(ierr); 1359b0a32e0cSBarry Smith ierr = PetscMalloc(size*sizeof(int),&sndcounts);CHKERRQ(ierr); 13608965ea79SLois Curfman McInnes for (i=0; i<size; i++) sndcounts[i] = rowners[i+1] - rowners[i]; 1361ca161407SBarry Smith ierr = MPI_Scatterv(rowlengths,sndcounts,rowners,MPI_INT,ourlens,rend-rstart,MPI_INT,0,comm);CHKERRQ(ierr); 1362606d414cSSatish Balay ierr = PetscFree(sndcounts);CHKERRQ(ierr); 1363ca161407SBarry Smith } else { 1364ca161407SBarry Smith ierr = MPI_Scatterv(0,0,0,MPI_INT,ourlens,rend-rstart,MPI_INT,0,comm);CHKERRQ(ierr); 13658965ea79SLois Curfman McInnes } 13668965ea79SLois Curfman McInnes 13678965ea79SLois Curfman McInnes if (!rank) { 13688965ea79SLois Curfman McInnes /* calculate the number of nonzeros on each processor */ 1369b0a32e0cSBarry Smith ierr = PetscMalloc(size*sizeof(int),&procsnz);CHKERRQ(ierr); 1370549d3d68SSatish Balay ierr = PetscMemzero(procsnz,size*sizeof(int));CHKERRQ(ierr); 13718965ea79SLois Curfman McInnes for (i=0; i<size; i++) { 13728965ea79SLois Curfman McInnes for (j=rowners[i]; j< rowners[i+1]; j++) { 13738965ea79SLois Curfman McInnes procsnz[i] += rowlengths[j]; 13748965ea79SLois Curfman McInnes } 13758965ea79SLois Curfman McInnes } 1376606d414cSSatish Balay ierr = PetscFree(rowlengths);CHKERRQ(ierr); 13778965ea79SLois Curfman McInnes 13788965ea79SLois Curfman McInnes /* determine max buffer needed and allocate it */ 13798965ea79SLois Curfman McInnes maxnz = 0; 13808965ea79SLois Curfman McInnes for (i=0; i<size; i++) { 13810452661fSBarry Smith maxnz = PetscMax(maxnz,procsnz[i]); 13828965ea79SLois Curfman McInnes } 1383b0a32e0cSBarry Smith ierr = PetscMalloc(maxnz*sizeof(int),&cols);CHKERRQ(ierr); 13848965ea79SLois Curfman McInnes 13858965ea79SLois Curfman McInnes /* read in my part of the matrix column indices */ 13868965ea79SLois Curfman McInnes nz = procsnz[0]; 1387b0a32e0cSBarry Smith ierr = PetscMalloc(nz*sizeof(int),&mycols);CHKERRQ(ierr); 13880752156aSBarry Smith ierr = PetscBinaryRead(fd,mycols,nz,PETSC_INT);CHKERRQ(ierr); 13898965ea79SLois Curfman McInnes 13908965ea79SLois Curfman McInnes /* read in every one elses and ship off */ 13918965ea79SLois Curfman McInnes for (i=1; i<size; i++) { 13928965ea79SLois Curfman McInnes nz = procsnz[i]; 13930752156aSBarry Smith ierr = PetscBinaryRead(fd,cols,nz,PETSC_INT);CHKERRQ(ierr); 1394ca161407SBarry Smith ierr = MPI_Send(cols,nz,MPI_INT,i,tag,comm);CHKERRQ(ierr); 13958965ea79SLois Curfman McInnes } 1396606d414cSSatish Balay ierr = PetscFree(cols);CHKERRQ(ierr); 13973a40ed3dSBarry Smith } else { 13988965ea79SLois Curfman McInnes /* determine buffer space needed for message */ 13998965ea79SLois Curfman McInnes nz = 0; 14008965ea79SLois Curfman McInnes for (i=0; i<m; i++) { 14018965ea79SLois Curfman McInnes nz += ourlens[i]; 14028965ea79SLois Curfman McInnes } 1403b0a32e0cSBarry Smith ierr = PetscMalloc(nz*sizeof(int),&mycols);CHKERRQ(ierr); 14048965ea79SLois Curfman McInnes 14058965ea79SLois Curfman McInnes /* receive message of column indices*/ 1406ca161407SBarry Smith ierr = MPI_Recv(mycols,nz,MPI_INT,0,tag,comm,&status);CHKERRQ(ierr); 1407ca161407SBarry Smith ierr = MPI_Get_count(&status,MPI_INT,&maxnz);CHKERRQ(ierr); 140829bbc08cSBarry Smith if (maxnz != nz) SETERRQ(PETSC_ERR_FILE_UNEXPECTED,"something is wrong with file"); 14098965ea79SLois Curfman McInnes } 14108965ea79SLois Curfman McInnes 14118965ea79SLois Curfman McInnes /* loop over local rows, determining number of off diagonal entries */ 1412549d3d68SSatish Balay ierr = PetscMemzero(offlens,m*sizeof(int));CHKERRQ(ierr); 14138965ea79SLois Curfman McInnes jj = 0; 14148965ea79SLois Curfman McInnes for (i=0; i<m; i++) { 14158965ea79SLois Curfman McInnes for (j=0; j<ourlens[i]; j++) { 14168965ea79SLois Curfman McInnes if (mycols[jj] < rstart || mycols[jj] >= rend) offlens[i]++; 14178965ea79SLois Curfman McInnes jj++; 14188965ea79SLois Curfman McInnes } 14198965ea79SLois Curfman McInnes } 14208965ea79SLois Curfman McInnes 14218965ea79SLois Curfman McInnes /* create our matrix */ 14228965ea79SLois Curfman McInnes for (i=0; i<m; i++) { 14238965ea79SLois Curfman McInnes ourlens[i] -= offlens[i]; 14248965ea79SLois Curfman McInnes } 1425878740d9SKris Buschelman ierr = MatCreate(comm,m,PETSC_DECIDE,M,N,newmat);CHKERRQ(ierr); 1426*be5d1d56SKris Buschelman ierr = MatSetType(*newmat,type);CHKERRQ(ierr); 1427878740d9SKris Buschelman ierr = MatMPIDenseSetPreallocation(*newmat,PETSC_NULL);CHKERRQ(ierr); 14288965ea79SLois Curfman McInnes A = *newmat; 14298965ea79SLois Curfman McInnes for (i=0; i<m; i++) { 14308965ea79SLois Curfman McInnes ourlens[i] += offlens[i]; 14318965ea79SLois Curfman McInnes } 14328965ea79SLois Curfman McInnes 14338965ea79SLois Curfman McInnes if (!rank) { 143487828ca2SBarry Smith ierr = PetscMalloc(maxnz*sizeof(PetscScalar),&vals);CHKERRQ(ierr); 14358965ea79SLois Curfman McInnes 14368965ea79SLois Curfman McInnes /* read in my part of the matrix numerical values */ 14378965ea79SLois Curfman McInnes nz = procsnz[0]; 14380752156aSBarry Smith ierr = PetscBinaryRead(fd,vals,nz,PETSC_SCALAR);CHKERRQ(ierr); 14398965ea79SLois Curfman McInnes 14408965ea79SLois Curfman McInnes /* insert into matrix */ 14418965ea79SLois Curfman McInnes jj = rstart; 14428965ea79SLois Curfman McInnes smycols = mycols; 14438965ea79SLois Curfman McInnes svals = vals; 14448965ea79SLois Curfman McInnes for (i=0; i<m; i++) { 14458965ea79SLois Curfman McInnes ierr = MatSetValues(A,1,&jj,ourlens[i],smycols,svals,INSERT_VALUES);CHKERRQ(ierr); 14468965ea79SLois Curfman McInnes smycols += ourlens[i]; 14478965ea79SLois Curfman McInnes svals += ourlens[i]; 14488965ea79SLois Curfman McInnes jj++; 14498965ea79SLois Curfman McInnes } 14508965ea79SLois Curfman McInnes 14518965ea79SLois Curfman McInnes /* read in other processors and ship out */ 14528965ea79SLois Curfman McInnes for (i=1; i<size; i++) { 14538965ea79SLois Curfman McInnes nz = procsnz[i]; 14540752156aSBarry Smith ierr = PetscBinaryRead(fd,vals,nz,PETSC_SCALAR);CHKERRQ(ierr); 1455ca161407SBarry Smith ierr = MPI_Send(vals,nz,MPIU_SCALAR,i,A->tag,comm);CHKERRQ(ierr); 14568965ea79SLois Curfman McInnes } 1457606d414cSSatish Balay ierr = PetscFree(procsnz);CHKERRQ(ierr); 14583a40ed3dSBarry Smith } else { 14598965ea79SLois Curfman McInnes /* receive numeric values */ 146087828ca2SBarry Smith ierr = PetscMalloc(nz*sizeof(PetscScalar),&vals);CHKERRQ(ierr); 14618965ea79SLois Curfman McInnes 14628965ea79SLois Curfman McInnes /* receive message of values*/ 1463ca161407SBarry Smith ierr = MPI_Recv(vals,nz,MPIU_SCALAR,0,A->tag,comm,&status);CHKERRQ(ierr); 1464ca161407SBarry Smith ierr = MPI_Get_count(&status,MPIU_SCALAR,&maxnz);CHKERRQ(ierr); 146529bbc08cSBarry Smith if (maxnz != nz) SETERRQ(PETSC_ERR_FILE_UNEXPECTED,"something is wrong with file"); 14668965ea79SLois Curfman McInnes 14678965ea79SLois Curfman McInnes /* insert into matrix */ 14688965ea79SLois Curfman McInnes jj = rstart; 14698965ea79SLois Curfman McInnes smycols = mycols; 14708965ea79SLois Curfman McInnes svals = vals; 14718965ea79SLois Curfman McInnes for (i=0; i<m; i++) { 14728965ea79SLois Curfman McInnes ierr = MatSetValues(A,1,&jj,ourlens[i],smycols,svals,INSERT_VALUES);CHKERRQ(ierr); 14738965ea79SLois Curfman McInnes smycols += ourlens[i]; 14748965ea79SLois Curfman McInnes svals += ourlens[i]; 14758965ea79SLois Curfman McInnes jj++; 14768965ea79SLois Curfman McInnes } 14778965ea79SLois Curfman McInnes } 1478606d414cSSatish Balay ierr = PetscFree(ourlens);CHKERRQ(ierr); 1479606d414cSSatish Balay ierr = PetscFree(vals);CHKERRQ(ierr); 1480606d414cSSatish Balay ierr = PetscFree(mycols);CHKERRQ(ierr); 1481606d414cSSatish Balay ierr = PetscFree(rowners);CHKERRQ(ierr); 14828965ea79SLois Curfman McInnes 14836d4a8577SBarry Smith ierr = MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14846d4a8577SBarry Smith ierr = MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14853a40ed3dSBarry Smith PetscFunctionReturn(0); 14868965ea79SLois Curfman McInnes } 148790ace30eSBarry Smith 148890ace30eSBarry Smith 148990ace30eSBarry Smith 149090ace30eSBarry Smith 149190ace30eSBarry Smith 1492