xref: /petsc/src/mat/impls/aij/mpi/mmaij.c (revision 0f5bd95cca42d693ada6d048329ab39533680180)
1a5eb4965SSatish Balay #ifdef PETSC_RCS_HEADER
2*0f5bd95cSBarry Smith static char vcid[] = "$Id: mmaij.c,v 1.48 1999/06/30 23:51:10 balay Exp bsmith $";
3cb512458SBarry Smith #endif
48c79f6d3SBarry Smith 
58c79f6d3SBarry Smith /*
68c79f6d3SBarry Smith    Support for the parallel AIJ matrix vector multiply
78c79f6d3SBarry Smith */
870f55243SBarry Smith #include "src/mat/impls/aij/mpi/mpiaij.h"
9f5eb4b81SSatish Balay #include "src/vec/vecimpl.h"
108c79f6d3SBarry Smith 
115615d1e5SSatish Balay #undef __FUNC__
125615d1e5SSatish Balay #define __FUNC__ "MatSetUpMultiply_MPIAIJ"
1344a69424SLois Curfman McInnes int MatSetUpMultiply_MPIAIJ(Mat mat)
148c79f6d3SBarry Smith {
1544a69424SLois Curfman McInnes   Mat_MPIAIJ         *aij = (Mat_MPIAIJ *) mat->data;
16ec8511deSBarry Smith   Mat_SeqAIJ         *B = (Mat_SeqAIJ *) (aij->B->data);
17416022c9SBarry Smith   int                N = aij->N,i,j,*indices,*aj = B->j,ierr,ec = 0,*garray;
18416022c9SBarry Smith   int                shift = B->indexshift;
191eb62cbbSBarry Smith   IS                 from,to;
201eb62cbbSBarry Smith   Vec                gvec;
21aa482453SBarry Smith #if defined (PETSC_USE_CTABLE)
22*0f5bd95cSBarry Smith   PetscTable         gid1_lid1;
23*0f5bd95cSBarry Smith   PetscTablePosition tpos;
242066d6f7SSatish Balay   int                gid, lid;
252066d6f7SSatish Balay #endif
262066d6f7SSatish Balay 
273a40ed3dSBarry Smith   PetscFunctionBegin;
282066d6f7SSatish Balay 
29aa482453SBarry Smith #if defined (PETSC_USE_CTABLE)
302066d6f7SSatish Balay   /* use a table - Mark Adams (this has not been tested with "shift") */
31*0f5bd95cSBarry Smith   PetscTableCreate(B->m,&gid1_lid1);
322066d6f7SSatish Balay   for ( i=0; i<B->m; i++ ) {
332066d6f7SSatish Balay     for ( j=0; j<B->ilen[i]; j++ ) {
3408c73f0fSSatish Balay       int data,gid1 = aj[B->i[i] + shift + j] + 1 + shift;
35*0f5bd95cSBarry Smith       ierr = PetscTableFind(gid1_lid1,gid1,&data);CHKERRQ(ierr);
36fa46199cSSatish Balay       if (!data) {
372066d6f7SSatish Balay         /* one based table */
38*0f5bd95cSBarry Smith         ierr = PetscTableAdd(gid1_lid1,gid1,++ec);CHKERRQ(ierr);
392066d6f7SSatish Balay       }
402066d6f7SSatish Balay     }
412066d6f7SSatish Balay   }
422066d6f7SSatish Balay   /* form array of columns we need */
432066d6f7SSatish Balay   garray = (int *)PetscMalloc((ec+1)*sizeof(int));CHKPTRQ(garray);
44*0f5bd95cSBarry Smith   ierr = PetscTableGetHeadPosition(gid1_lid1,&tpos);CHKERRQ(ierr);
452066d6f7SSatish Balay   while (tpos) {
46*0f5bd95cSBarry Smith     ierr = PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid);CHKERRQ(ierr);
472066d6f7SSatish Balay     gid--; lid--;
482066d6f7SSatish Balay     garray[lid] = gid;
492066d6f7SSatish Balay   }
500064e2bbSSatish Balay   ierr = PetscSortInt(ec,garray);CHKERRQ(ierr); /* sort, and rebuild */
510064e2bbSSatish Balay   /* qsort( garray, ec, sizeof(int), intcomparc ); */
52*0f5bd95cSBarry Smith   ierr = PetscTableRemoveAll(gid1_lid1);CHKERRQ(ierr);
532066d6f7SSatish Balay   for ( i=0; i<ec; i++ ) {
54*0f5bd95cSBarry Smith     ierr = PetscTableAdd(gid1_lid1,garray[i]+1,i+1);CHKERRQ(ierr);
552066d6f7SSatish Balay   }
562066d6f7SSatish Balay   /* compact out the extra columns in B */
572066d6f7SSatish Balay   for ( i=0; i<B->m; i++ ) {
582066d6f7SSatish Balay     for ( j=0; j<B->ilen[i]; j++ ) {
5908c73f0fSSatish Balay       int gid1 = aj[B->i[i] + shift + j] + 1 + shift;
60*0f5bd95cSBarry Smith       ierr = PetscTableFind(gid1_lid1,gid1,&lid);CHKERRQ(ierr);
61fa46199cSSatish Balay       lid --;
6208c73f0fSSatish Balay       aj[B->i[i] + shift + j]  = lid - shift;
632066d6f7SSatish Balay     }
642066d6f7SSatish Balay   }
652066d6f7SSatish Balay   B->n = aij->B->n = aij->B->N = ec;
66*0f5bd95cSBarry Smith   ierr = PetscTableDelete(gid1_lid1);CHKERRQ(ierr);
672066d6f7SSatish Balay   /* Mark Adams */
682066d6f7SSatish Balay #else
698c79f6d3SBarry Smith   /* For the first stab we make an array as long as the number of columns */
701eb62cbbSBarry Smith   /* mark those columns that are in aij->B */
71ac03b0baSBarry Smith   indices = (int *) PetscMalloc( (N+1)*sizeof(int) );CHKPTRQ(indices);
72549d3d68SSatish Balay   ierr = PetscMemzero(indices,N*sizeof(int));CHKERRQ(ierr);
73d6dfbf8fSBarry Smith   for ( i=0; i<B->m; i++ ) {
74d6dfbf8fSBarry Smith     for ( j=0; j<B->ilen[i]; j++ ) {
75dbb450caSBarry Smith       if (!indices[aj[B->i[i] +shift + j] + shift]) ec++;
76416022c9SBarry Smith       indices[aj[B->i[i] + shift + j] + shift] = 1;
77416022c9SBarry Smith     }
781eb62cbbSBarry Smith   }
798c79f6d3SBarry Smith 
801eb62cbbSBarry Smith   /* form array of columns we need */
810452661fSBarry Smith   garray = (int *) PetscMalloc( (ec+1)*sizeof(int) );CHKPTRQ(garray);
821eb62cbbSBarry Smith   ec = 0;
831eb62cbbSBarry Smith   for ( i=0; i<N; i++ ) {
841eb62cbbSBarry Smith     if (indices[i]) garray[ec++] = i;
851eb62cbbSBarry Smith   }
861eb62cbbSBarry Smith 
871eb62cbbSBarry Smith   /* make indices now point into garray */
881eb62cbbSBarry Smith   for ( i=0; i<ec; i++ ) {
89dbb450caSBarry Smith     indices[garray[i]] = i-shift;
901eb62cbbSBarry Smith   }
911eb62cbbSBarry Smith 
921eb62cbbSBarry Smith   /* compact out the extra columns in B */
93d6dfbf8fSBarry Smith   for ( i=0; i<B->m; i++ ) {
94d6dfbf8fSBarry Smith     for ( j=0; j<B->ilen[i]; j++ ) {
95dbb450caSBarry Smith       aj[B->i[i] + shift + j] = indices[aj[B->i[i] + shift + j]+shift];
961eb62cbbSBarry Smith     }
97d6dfbf8fSBarry Smith   }
98639f9d9dSBarry Smith   B->n = aij->B->n = aij->B->N = ec;
99606d414cSSatish Balay   ierr = PetscFree(indices);CHKERRQ(ierr);
1002066d6f7SSatish Balay #endif
1011eb62cbbSBarry Smith   /* create local vector that is used to scatter into */
102029af93fSBarry Smith   ierr = VecCreateSeq(PETSC_COMM_SELF,ec,&aij->lvec);CHKERRQ(ierr);
1031eb62cbbSBarry Smith 
104d6dfbf8fSBarry Smith   /* create two temporary Index sets for build scatter gather */
105029af93fSBarry Smith   ierr = ISCreateGeneral(PETSC_COMM_SELF,ec,garray,&from);CHKERRQ(ierr);
106029af93fSBarry Smith   ierr = ISCreateStride(PETSC_COMM_SELF,ec,0,1,&to);CHKERRQ(ierr);
1071eb62cbbSBarry Smith 
1081eb62cbbSBarry Smith   /* create temporary global vector to generate scatter context */
1091eb62cbbSBarry Smith   /* this is inefficient, but otherwise we must do either
1101eb62cbbSBarry Smith      1) save garray until the first actual scatter when the vector is known or
1111eb62cbbSBarry Smith      2) have another way of generating a scatter context without a vector.*/
11278b31e54SBarry Smith   ierr = VecCreateMPI(mat->comm,aij->n,aij->N,&gvec);CHKERRQ(ierr);
1131eb62cbbSBarry Smith 
1142d336d48SLois Curfman McInnes   /* generate the scatter context */
11508480c60SBarry Smith   ierr = VecScatterCreate(gvec,from,aij->lvec,to,&aij->Mvctx);CHKERRQ(ierr);
116a5a9c739SBarry Smith   PLogObjectParent(mat,aij->Mvctx);
117a5a9c739SBarry Smith   PLogObjectParent(mat,aij->lvec);
118464493b3SBarry Smith   PLogObjectParent(mat,from);
119464493b3SBarry Smith   PLogObjectParent(mat,to);
1209e25ed09SBarry Smith   aij->garray = garray;
121464493b3SBarry Smith   PLogObjectMemory(mat,(ec+1)*sizeof(int));
12278b31e54SBarry Smith   ierr = ISDestroy(from);CHKERRQ(ierr);
12378b31e54SBarry Smith   ierr = ISDestroy(to);CHKERRQ(ierr);
124888f2ed8SSatish Balay   ierr = VecDestroy(gvec);CHKERRQ(ierr);
1253a40ed3dSBarry Smith   PetscFunctionReturn(0);
1268c79f6d3SBarry Smith }
1279e25ed09SBarry Smith 
1289e25ed09SBarry Smith 
1295615d1e5SSatish Balay #undef __FUNC__
1305615d1e5SSatish Balay #define __FUNC__ "DisAssemble_MPIAIJ"
1312493cbb0SBarry Smith /*
1322493cbb0SBarry Smith      Takes the local part of an already assembled MPIAIJ matrix
1332493cbb0SBarry Smith    and disassembles it. This is to allow new nonzeros into the matrix
1342493cbb0SBarry Smith    that require more communication in the matrix vector multiply.
1352493cbb0SBarry Smith    Thus certain data-structures must be rebuilt.
1362493cbb0SBarry Smith 
1372493cbb0SBarry Smith    Kind of slow! But that's what application programmers get when
1382493cbb0SBarry Smith    they are sloppy.
1392493cbb0SBarry Smith */
1402493cbb0SBarry Smith int DisAssemble_MPIAIJ(Mat A)
1412493cbb0SBarry Smith {
1422493cbb0SBarry Smith   Mat_MPIAIJ *aij = (Mat_MPIAIJ *) A->data;
1432493cbb0SBarry Smith   Mat        B = aij->B,Bnew;
144ec8511deSBarry Smith   Mat_SeqAIJ *Baij = (Mat_SeqAIJ*)B->data;
1452493cbb0SBarry Smith   int        ierr,i,j,m = Baij->m,n = aij->N,col,ct = 0,*garray = aij->garray;
146416022c9SBarry Smith   int        *nz,ec,shift = Baij->indexshift;
1472493cbb0SBarry Smith   Scalar     v;
1482493cbb0SBarry Smith 
1493a40ed3dSBarry Smith   PetscFunctionBegin;
1502493cbb0SBarry Smith   /* free stuff related to matrix-vec multiply */
151888f2ed8SSatish Balay   ierr = VecGetSize(aij->lvec,&ec);CHKERRQ(ierr); /* needed for PLogObjectMemory below */
1522493cbb0SBarry Smith   ierr = VecDestroy(aij->lvec);CHKERRQ(ierr); aij->lvec = 0;
15308480c60SBarry Smith   ierr = VecScatterDestroy(aij->Mvctx);CHKERRQ(ierr); aij->Mvctx = 0;
154464493b3SBarry Smith   if (aij->colmap) {
155aa482453SBarry Smith #if defined (PETSC_USE_CTABLE)
156*0f5bd95cSBarry Smith     ierr = PetscTableDelete(aij->colmap); CHKERRQ(ierr);
157*0f5bd95cSBarry Smith     aij->colmap = 0;
1582066d6f7SSatish Balay #else
159606d414cSSatish Balay     ierr = PetscFree(aij->colmap);CHKERRQ(ierr);
160606d414cSSatish Balay     aij->colmap = 0;
161464493b3SBarry Smith     PLogObjectMemory(A,-Baij->n*sizeof(int));
1622066d6f7SSatish Balay #endif
163464493b3SBarry Smith   }
1642493cbb0SBarry Smith 
1652493cbb0SBarry Smith   /* make sure that B is assembled so we can access its values */
1666d4a8577SBarry Smith   ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
167fe2f2677SBarry Smith   ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1682493cbb0SBarry Smith 
1692493cbb0SBarry Smith   /* invent new B and copy stuff over */
170639f9d9dSBarry Smith   nz = (int *) PetscMalloc( (m+1)*sizeof(int) );CHKPTRQ(nz);
17148b35521SBarry Smith   for ( i=0; i<m; i++ ) {
17248b35521SBarry Smith     nz[i] = Baij->i[i+1] - Baij->i[i];
17348b35521SBarry Smith   }
174029af93fSBarry Smith   ierr = MatCreateSeqAIJ(PETSC_COMM_SELF,m,n,0,nz,&Bnew);CHKERRQ(ierr);
175606d414cSSatish Balay   ierr = PetscFree(nz);CHKERRQ(ierr);
1762493cbb0SBarry Smith   for ( i=0; i<m; i++ ) {
177dbb450caSBarry Smith     for ( j=Baij->i[i]+shift; j<Baij->i[i+1]+shift; j++ ) {
178dbb450caSBarry Smith       col  = garray[Baij->j[ct]+shift];
1792493cbb0SBarry Smith       v    = Baij->a[ct++];
18083271157SBarry Smith       ierr = MatSetValues(Bnew,1,&i,1,&col,&v,B->insertmode);CHKERRQ(ierr);
1812493cbb0SBarry Smith     }
1822493cbb0SBarry Smith   }
183606d414cSSatish Balay   ierr = PetscFree(aij->garray);CHKERRQ(ierr);
184606d414cSSatish Balay   aij->garray = 0;
185464493b3SBarry Smith   PLogObjectMemory(A,-ec*sizeof(int));
1862493cbb0SBarry Smith   ierr = MatDestroy(B);CHKERRQ(ierr);
187464493b3SBarry Smith   PLogObjectParent(A,Bnew);
1882493cbb0SBarry Smith   aij->B = Bnew;
189227d817aSBarry Smith   A->was_assembled = PETSC_FALSE;
1903a40ed3dSBarry Smith   PetscFunctionReturn(0);
1912493cbb0SBarry Smith }
1922493cbb0SBarry Smith 
19348b35521SBarry Smith 
194