xref: /petsc/src/mat/impls/aij/mpi/mmaij.c (revision 5615d1e584023db9367fb782d85b1b4ebbb8df18)
1cb512458SBarry Smith #ifndef lint
2*5615d1e5SSatish Balay static char vcid[] = "$Id: mmaij.c,v 1.34 1996/12/17 18:18:08 balay Exp balay $";
3cb512458SBarry Smith #endif
48c79f6d3SBarry Smith 
5d6dfbf8fSBarry Smith 
68c79f6d3SBarry Smith /*
78c79f6d3SBarry Smith    Support for the parallel AIJ matrix vector multiply
88c79f6d3SBarry Smith */
970f55243SBarry Smith #include "src/mat/impls/aij/mpi/mpiaij.h"
10f5eb4b81SSatish Balay #include "src/vec/vecimpl.h"
118c79f6d3SBarry Smith 
12*5615d1e5SSatish Balay #undef __FUNC__
13*5615d1e5SSatish Balay #define __FUNC__ "MatSetUpMultiply_MPIAIJ"
1444a69424SLois Curfman McInnes int MatSetUpMultiply_MPIAIJ(Mat mat)
158c79f6d3SBarry Smith {
1644a69424SLois Curfman McInnes   Mat_MPIAIJ *aij = (Mat_MPIAIJ *) mat->data;
17ec8511deSBarry Smith   Mat_SeqAIJ *B = (Mat_SeqAIJ *) (aij->B->data);
18416022c9SBarry Smith   int        N = aij->N,i,j,*indices,*aj = B->j,ierr,ec = 0,*garray;
19416022c9SBarry Smith   int        shift = B->indexshift;
201eb62cbbSBarry Smith   IS         from,to;
211eb62cbbSBarry Smith   Vec        gvec;
228c79f6d3SBarry Smith 
238c79f6d3SBarry Smith   /* For the first stab we make an array as long as the number of columns */
241eb62cbbSBarry Smith   /* mark those columns that are in aij->B */
25ac03b0baSBarry Smith   indices = (int *) PetscMalloc( (N+1)*sizeof(int) ); CHKPTRQ(indices);
26cddf8d76SBarry Smith   PetscMemzero(indices,N*sizeof(int));
27d6dfbf8fSBarry Smith   for ( i=0; i<B->m; i++ ) {
28d6dfbf8fSBarry Smith     for ( j=0; j<B->ilen[i]; j++ ) {
29dbb450caSBarry Smith       if (!indices[aj[B->i[i] +shift + j] + shift]) ec++;
30416022c9SBarry Smith       indices[aj[B->i[i] + shift + j] + shift] = 1;
31416022c9SBarry Smith     }
321eb62cbbSBarry Smith   }
338c79f6d3SBarry Smith 
341eb62cbbSBarry Smith   /* form array of columns we need */
350452661fSBarry Smith   garray = (int *) PetscMalloc( (ec+1)*sizeof(int) ); CHKPTRQ(garray);
361eb62cbbSBarry Smith   ec = 0;
371eb62cbbSBarry Smith   for ( i=0; i<N; i++ ) {
381eb62cbbSBarry Smith     if (indices[i]) garray[ec++] = i;
391eb62cbbSBarry Smith   }
401eb62cbbSBarry Smith 
411eb62cbbSBarry Smith   /* make indices now point into garray */
421eb62cbbSBarry Smith   for ( i=0; i<ec; i++ ) {
43dbb450caSBarry Smith     indices[garray[i]] = i-shift;
441eb62cbbSBarry Smith   }
451eb62cbbSBarry Smith 
461eb62cbbSBarry Smith   /* compact out the extra columns in B */
47d6dfbf8fSBarry Smith   for ( i=0; i<B->m; i++ ) {
48d6dfbf8fSBarry Smith     for ( j=0; j<B->ilen[i]; j++ ) {
49dbb450caSBarry Smith       aj[B->i[i] + shift + j] = indices[aj[B->i[i] + shift + j]+shift];
501eb62cbbSBarry Smith     }
51d6dfbf8fSBarry Smith   }
52639f9d9dSBarry Smith   B->n = aij->B->n = aij->B->N = ec;
530452661fSBarry Smith   PetscFree(indices);
541eb62cbbSBarry Smith 
551eb62cbbSBarry Smith   /* create local vector that is used to scatter into */
56fafbff53SBarry Smith   ierr = VecCreateSeq(MPI_COMM_SELF,ec,&aij->lvec); CHKERRQ(ierr);
571eb62cbbSBarry Smith 
58d6dfbf8fSBarry Smith   /* create two temporary Index sets for build scatter gather */
59537820f0SBarry Smith   ierr = ISCreateGeneral(MPI_COMM_SELF,ec,garray,&from); CHKERRQ(ierr);
60537820f0SBarry Smith   ierr = ISCreateStride(MPI_COMM_SELF,ec,0,1,&to); CHKERRQ(ierr);
611eb62cbbSBarry Smith 
621eb62cbbSBarry Smith   /* create temporary global vector to generate scatter context */
631eb62cbbSBarry Smith   /* this is inefficient, but otherwise we must do either
641eb62cbbSBarry Smith      1) save garray until the first actual scatter when the vector is known or
651eb62cbbSBarry Smith      2) have another way of generating a scatter context without a vector.*/
6678b31e54SBarry Smith   ierr = VecCreateMPI(mat->comm,aij->n,aij->N,&gvec); CHKERRQ(ierr);
671eb62cbbSBarry Smith 
682d336d48SLois Curfman McInnes   /* generate the scatter context */
6908480c60SBarry Smith   ierr = VecScatterCreate(gvec,from,aij->lvec,to,&aij->Mvctx); CHKERRQ(ierr);
70a5a9c739SBarry Smith   PLogObjectParent(mat,aij->Mvctx);
71a5a9c739SBarry Smith   PLogObjectParent(mat,aij->lvec);
72464493b3SBarry Smith   PLogObjectParent(mat,from);
73464493b3SBarry Smith   PLogObjectParent(mat,to);
749e25ed09SBarry Smith   aij->garray = garray;
75464493b3SBarry Smith   PLogObjectMemory(mat,(ec+1)*sizeof(int));
7678b31e54SBarry Smith   ierr = ISDestroy(from); CHKERRQ(ierr);
7778b31e54SBarry Smith   ierr = ISDestroy(to); CHKERRQ(ierr);
781eb62cbbSBarry Smith   ierr = VecDestroy(gvec);
798c79f6d3SBarry Smith   return 0;
808c79f6d3SBarry Smith }
819e25ed09SBarry Smith 
829e25ed09SBarry Smith 
83*5615d1e5SSatish Balay #undef __FUNC__
84*5615d1e5SSatish Balay #define __FUNC__ "DisAssemble_MPIAIJ"
852493cbb0SBarry Smith /*
862493cbb0SBarry Smith      Takes the local part of an already assembled MPIAIJ matrix
872493cbb0SBarry Smith    and disassembles it. This is to allow new nonzeros into the matrix
882493cbb0SBarry Smith    that require more communication in the matrix vector multiply.
892493cbb0SBarry Smith    Thus certain data-structures must be rebuilt.
902493cbb0SBarry Smith 
912493cbb0SBarry Smith    Kind of slow! But that's what application programmers get when
922493cbb0SBarry Smith    they are sloppy.
932493cbb0SBarry Smith */
942493cbb0SBarry Smith int DisAssemble_MPIAIJ(Mat A)
952493cbb0SBarry Smith {
962493cbb0SBarry Smith   Mat_MPIAIJ *aij = (Mat_MPIAIJ *) A->data;
972493cbb0SBarry Smith   Mat        B = aij->B,Bnew;
98ec8511deSBarry Smith   Mat_SeqAIJ *Baij = (Mat_SeqAIJ*)B->data;
992493cbb0SBarry Smith   int        ierr,i,j,m = Baij->m,n = aij->N,col,ct = 0,*garray = aij->garray;
100416022c9SBarry Smith   int        *nz,ec,shift = Baij->indexshift;
1012493cbb0SBarry Smith   Scalar     v;
1022493cbb0SBarry Smith 
1032493cbb0SBarry Smith   /* free stuff related to matrix-vec multiply */
104464493b3SBarry Smith   ierr = VecGetSize(aij->lvec,&ec); /* needed for PLogObjectMemory below */
1052493cbb0SBarry Smith   ierr = VecDestroy(aij->lvec); CHKERRQ(ierr); aij->lvec = 0;
10608480c60SBarry Smith   ierr = VecScatterDestroy(aij->Mvctx); CHKERRQ(ierr); aij->Mvctx = 0;
107464493b3SBarry Smith   if (aij->colmap) {
1080452661fSBarry Smith     PetscFree(aij->colmap); aij->colmap = 0;
109464493b3SBarry Smith     PLogObjectMemory(A,-Baij->n*sizeof(int));
110464493b3SBarry Smith   }
1112493cbb0SBarry Smith 
1122493cbb0SBarry Smith   /* make sure that B is assembled so we can access its values */
1136d4a8577SBarry Smith   ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY); CHKERRQ(ierr);
114fe2f2677SBarry Smith   ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY); CHKERRQ(ierr);
1152493cbb0SBarry Smith 
1162493cbb0SBarry Smith   /* invent new B and copy stuff over */
117639f9d9dSBarry Smith   nz = (int *) PetscMalloc( (m+1)*sizeof(int) ); CHKPTRQ(nz);
11848b35521SBarry Smith   for ( i=0; i<m; i++ ) {
11948b35521SBarry Smith     nz[i] = Baij->i[i+1] - Baij->i[i];
12048b35521SBarry Smith   }
121fafbff53SBarry Smith   ierr = MatCreateSeqAIJ(MPI_COMM_SELF,m,n,0,nz,&Bnew); CHKERRQ(ierr);
1220452661fSBarry Smith   PetscFree(nz);
1232493cbb0SBarry Smith   for ( i=0; i<m; i++ ) {
124dbb450caSBarry Smith     for ( j=Baij->i[i]+shift; j<Baij->i[i+1]+shift; j++ ) {
125dbb450caSBarry Smith       col = garray[Baij->j[ct]+shift];
1262493cbb0SBarry Smith       v = Baij->a[ct++];
127dbb450caSBarry Smith       ierr = MatSetValues(Bnew,1,&i,1,&col,&v,INSERT_VALUES); CHKERRQ(ierr);
1282493cbb0SBarry Smith     }
1292493cbb0SBarry Smith   }
1300452661fSBarry Smith   PetscFree(aij->garray); aij->garray = 0;
131464493b3SBarry Smith   PLogObjectMemory(A,-ec*sizeof(int));
1322493cbb0SBarry Smith   ierr = MatDestroy(B); CHKERRQ(ierr);
133464493b3SBarry Smith   PLogObjectParent(A,Bnew);
1342493cbb0SBarry Smith   aij->B = Bnew;
135227d817aSBarry Smith   A->was_assembled = PETSC_FALSE;
1362493cbb0SBarry Smith   return 0;
1372493cbb0SBarry Smith }
1382493cbb0SBarry Smith 
13948b35521SBarry Smith 
140