1cac129eeSSatish Balay #ifndef lint 2*70f55243SBarry Smith static char vcid[] = "$Id: baij2.c,v 1.6 1996/08/06 04:02:46 bsmith Exp bsmith $"; 3cac129eeSSatish Balay #endif 4cac129eeSSatish Balay 5*70f55243SBarry Smith #include "src/mat/impls/baij/seq/baij.h" 6cac129eeSSatish Balay #include "petsc.h" 7736121d4SSatish Balay #include "src/inline/bitarray.h" 8cac129eeSSatish Balay 9736121d4SSatish Balay int MatIncreaseOverlap_SeqBAIJ(Mat A,int is_max,IS *is,int ov) 10a3192f15SSatish Balay { 11a3192f15SSatish Balay Mat_SeqBAIJ *a = (Mat_SeqBAIJ *) A->data; 12218c64b6SSatish Balay int row, i,j,k,l,m,n, *idx,ierr, *nidx, isz, val, ival; 13218c64b6SSatish Balay int start, end, *ai, *aj,bs,*nidx2; 14a3192f15SSatish Balay char *table; 15a3192f15SSatish Balay 16a3192f15SSatish Balay m = a->mbs; 17a3192f15SSatish Balay ai = a->i; 18a3192f15SSatish Balay aj = a->j; 19218c64b6SSatish Balay bs = a->bs; 20a3192f15SSatish Balay 21a3192f15SSatish Balay if (ov < 0) SETERRQ(1,"MatIncreaseOverlap_SeqBAIJ: illegal overlap value used"); 22a3192f15SSatish Balay 23a3192f15SSatish Balay table = (char *) PetscMalloc((m/BITSPERBYTE +1)*sizeof(char)); CHKPTRQ(table); 24a3192f15SSatish Balay nidx = (int *) PetscMalloc((m+1)*sizeof(int)); CHKPTRQ(nidx); 25218c64b6SSatish Balay nidx2 = (int *)PetscMalloc((a->m+1)*sizeof(int)); CHKPTRQ(nidx2); 26a3192f15SSatish Balay 27a3192f15SSatish Balay for ( i=0; i<is_max; i++ ) { 28a3192f15SSatish Balay /* Initialise the two local arrays */ 29a3192f15SSatish Balay isz = 0; 30a3192f15SSatish Balay PetscMemzero(table,(m/BITSPERBYTE +1)*sizeof(char)); 31a3192f15SSatish Balay 32a3192f15SSatish Balay /* Extract the indices, assume there can be duplicate entries */ 33a3192f15SSatish Balay ierr = ISGetIndices(is[i],&idx); CHKERRQ(ierr); 34a3192f15SSatish Balay ierr = ISGetSize(is[i],&n); CHKERRQ(ierr); 35a3192f15SSatish Balay 36a3192f15SSatish Balay /* Enter these into the temp arrays i.e mark table[row], enter row into new index */ 37a3192f15SSatish Balay for ( j=0; j<n ; ++j){ 38218c64b6SSatish Balay ival = idx[j]/bs; /* convert the indices into block indices */ 39218c64b6SSatish Balay if (ival>m) SETERRQ(1,"MatIncreaseOverlap_SeqBAIJ: index greater than mat-dim"); 40218c64b6SSatish Balay if(!BT_LOOKUP(table, ival)) { nidx[isz++] = ival;} 41a3192f15SSatish Balay } 42a3192f15SSatish Balay ierr = ISRestoreIndices(is[i],&idx); CHKERRQ(ierr); 43a3192f15SSatish Balay ierr = ISDestroy(is[i]); CHKERRQ(ierr); 44a3192f15SSatish Balay 45a3192f15SSatish Balay k = 0; 46a3192f15SSatish Balay for ( j=0; j<ov; j++){ /* for each overlap*/ 47a3192f15SSatish Balay n = isz; 48a3192f15SSatish Balay for ( ; k<n ; k++){ /* do only those rows in nidx[k], which are not done yet */ 49a3192f15SSatish Balay row = nidx[k]; 50a3192f15SSatish Balay start = ai[row]; 51a3192f15SSatish Balay end = ai[row+1]; 52a3192f15SSatish Balay for ( l = start; l<end ; l++){ 53a3192f15SSatish Balay val = aj[l]; 54a3192f15SSatish Balay if (!BT_LOOKUP(table,val)) {nidx[isz++] = val;} 55a3192f15SSatish Balay } 56a3192f15SSatish Balay } 57a3192f15SSatish Balay } 58218c64b6SSatish Balay /* expand the Index Set */ 59218c64b6SSatish Balay for (j=0; j<isz; j++ ) { 60218c64b6SSatish Balay for (k=0; k<bs; k++ ) 61218c64b6SSatish Balay nidx2[j*bs+k] = nidx[j]*bs+k; 62218c64b6SSatish Balay } 63218c64b6SSatish Balay ierr = ISCreateSeq(MPI_COMM_SELF, isz*bs, nidx2, (is+i)); CHKERRQ(ierr); 64a3192f15SSatish Balay } 65a3192f15SSatish Balay PetscFree(table); 66a3192f15SSatish Balay PetscFree(nidx); 67218c64b6SSatish Balay PetscFree(nidx2); 68a3192f15SSatish Balay return 0; 69a3192f15SSatish Balay } 70218c64b6SSatish Balay int MatGetSubMatrix_SeqBAIJ_Private(Mat A,IS isrow,IS iscol,MatGetSubMatrixCall scall,Mat *B) 71736121d4SSatish Balay { 72736121d4SSatish Balay Mat_SeqBAIJ *a = (Mat_SeqBAIJ *) A->data,*c; 73736121d4SSatish Balay int nznew, *smap, i, k, kstart, kend, ierr, oldcols = a->nbs,*lens; 74218c64b6SSatish Balay int row,mat_i,*mat_j,tcol,*mat_ilen; 75736121d4SSatish Balay int *irow, *icol, nrows, ncols,*ssmap,bs=a->bs, bs2=a->bs2; 76218c64b6SSatish Balay int *aj = a->j, *ai = a->i; 77218c64b6SSatish Balay Scalar *mat_a; 78736121d4SSatish Balay Mat C; 79736121d4SSatish Balay 80736121d4SSatish Balay ierr = ISSorted(iscol,(PetscTruth*)&i); 81736121d4SSatish Balay if (!i) SETERRQ(1,"MatGetSubmatrices_SeqBAIJ:IS is not sorted"); 82736121d4SSatish Balay 83736121d4SSatish Balay ierr = ISGetIndices(isrow,&irow); CHKERRQ(ierr); 84218c64b6SSatish Balay ierr = ISGetIndices(iscol,&icol); CHKERRQ(ierr); 85736121d4SSatish Balay ierr = ISGetSize(isrow,&nrows); CHKERRQ(ierr); 86736121d4SSatish Balay ierr = ISGetSize(iscol,&ncols); CHKERRQ(ierr); 87736121d4SSatish Balay 88736121d4SSatish Balay smap = (int *) PetscMalloc((1+oldcols)*sizeof(int)); CHKPTRQ(smap); 89736121d4SSatish Balay ssmap = smap; 90736121d4SSatish Balay lens = (int *) PetscMalloc((1+nrows)*sizeof(int)); CHKPTRQ(lens); 91736121d4SSatish Balay PetscMemzero(smap,oldcols*sizeof(int)); 92736121d4SSatish Balay for ( i=0; i<ncols; i++ ) smap[icol[i]] = i+1; 93736121d4SSatish Balay /* determine lens of each row */ 94736121d4SSatish Balay for (i=0; i<nrows; i++) { 95736121d4SSatish Balay kstart = ai[irow[i]]; 96736121d4SSatish Balay kend = kstart + a->ilen[irow[i]]; 97736121d4SSatish Balay lens[i] = 0; 98736121d4SSatish Balay for ( k=kstart; k<kend; k++ ) { 99736121d4SSatish Balay if (ssmap[aj[k]]) { 100736121d4SSatish Balay lens[i]++; 101736121d4SSatish Balay } 102736121d4SSatish Balay } 103736121d4SSatish Balay } 104736121d4SSatish Balay /* Create and fill new matrix */ 105736121d4SSatish Balay if (scall == MAT_REUSE_MATRIX) { 106736121d4SSatish Balay c = (Mat_SeqBAIJ *)((*B)->data); 107736121d4SSatish Balay 108736121d4SSatish Balay if (c->mbs!=nrows || c->nbs!=ncols || c->bs!=bs) 109736121d4SSatish Balay SETERRQ(1,"MatGetSubMatrix_SeqBAIJ:"); 110736121d4SSatish Balay if (PetscMemcmp(c->ilen,lens, c->mbs *sizeof(int))) { 111736121d4SSatish Balay SETERRQ(1,"MatGetSubmatrix_SeqBAIJ:Cannot reuse matrix. wrong no of nonzeros"); 112736121d4SSatish Balay } 113736121d4SSatish Balay PetscMemzero(c->ilen,c->mbs*sizeof(int)); 114736121d4SSatish Balay C = *B; 115736121d4SSatish Balay } 116736121d4SSatish Balay else { 117736121d4SSatish Balay ierr = MatCreateSeqBAIJ(A->comm,bs,nrows*bs,ncols*bs,0,lens,&C);CHKERRQ(ierr); 118736121d4SSatish Balay } 119736121d4SSatish Balay c = (Mat_SeqBAIJ *)(C->data); 120736121d4SSatish Balay for (i=0; i<nrows; i++) { 121736121d4SSatish Balay row = irow[i]; 122736121d4SSatish Balay nznew = 0; 123736121d4SSatish Balay kstart = ai[row]; 124736121d4SSatish Balay kend = kstart + a->ilen[row]; 125736121d4SSatish Balay mat_i = c->i[i]; 126736121d4SSatish Balay mat_j = c->j + mat_i; 127218c64b6SSatish Balay mat_a = c->a + mat_i*bs2; 128736121d4SSatish Balay mat_ilen = c->ilen + i; 129736121d4SSatish Balay for ( k=kstart; k<kend; k++ ) { 130736121d4SSatish Balay if ((tcol=ssmap[a->j[k]])) { 131736121d4SSatish Balay *mat_j++ = tcol - 1; 132736121d4SSatish Balay PetscMemcpy(mat_a,a->a+k*bs2,bs2*sizeof(Scalar)); mat_a+=bs2; 133736121d4SSatish Balay (*mat_ilen)++; 134736121d4SSatish Balay 135736121d4SSatish Balay } 136736121d4SSatish Balay } 137736121d4SSatish Balay } 138218c64b6SSatish Balay 139736121d4SSatish Balay /* Free work space */ 140736121d4SSatish Balay ierr = ISRestoreIndices(iscol,&icol); CHKERRQ(ierr); 141736121d4SSatish Balay PetscFree(smap); PetscFree(lens); 1426d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY); CHKERRQ(ierr); 1436d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY); CHKERRQ(ierr); 144736121d4SSatish Balay 145736121d4SSatish Balay ierr = ISRestoreIndices(isrow,&irow); CHKERRQ(ierr); 146736121d4SSatish Balay *B = C; 147736121d4SSatish Balay return 0; 148736121d4SSatish Balay } 149736121d4SSatish Balay 150218c64b6SSatish Balay int MatGetSubMatrix_SeqBAIJ(Mat A,IS isrow,IS iscol,MatGetSubMatrixCall scall,Mat *B) 151218c64b6SSatish Balay { 152218c64b6SSatish Balay Mat_SeqBAIJ *a = (Mat_SeqBAIJ *) A->data; 153218c64b6SSatish Balay IS is1,is2; 154218c64b6SSatish Balay int *vary,*iary,*irow,*icol,nrows,ncols,i,ierr,bs=a->bs,count; 155218c64b6SSatish Balay 156218c64b6SSatish Balay ierr = ISGetIndices(isrow,&irow); CHKERRQ(ierr); 157218c64b6SSatish Balay ierr = ISGetIndices(iscol,&icol); CHKERRQ(ierr); 158218c64b6SSatish Balay ierr = ISGetSize(isrow,&nrows); CHKERRQ(ierr); 159218c64b6SSatish Balay ierr = ISGetSize(iscol,&ncols); CHKERRQ(ierr); 160218c64b6SSatish Balay 161218c64b6SSatish Balay /* Verify if the indices corespond to each elementin a block 162218c64b6SSatish Balay and form the IS with compressed IS */ 163218c64b6SSatish Balay vary = (int *) PetscMalloc(2*(a->mbs+1)*sizeof(int)); CHKPTRQ(vary); 164218c64b6SSatish Balay iary = vary + a->mbs; 165218c64b6SSatish Balay PetscMemzero(vary,(a->mbs)*sizeof(int)); 166218c64b6SSatish Balay for ( i=0; i<nrows; i++) vary[irow[i]/bs]++; 167218c64b6SSatish Balay count = 0; 168218c64b6SSatish Balay for (i=0; i<a->mbs; i++) { 169218c64b6SSatish Balay if (vary[i]!=0 && vary[i]!=bs) SETERRA(1,"MatGetSubmatrices_SeqBAIJ:"); 170218c64b6SSatish Balay if (vary[i]==bs) iary[count++] = i; 171218c64b6SSatish Balay } 172218c64b6SSatish Balay ierr = ISCreateSeq(MPI_COMM_SELF, count, iary,&is1); CHKERRQ(ierr); 173218c64b6SSatish Balay 174218c64b6SSatish Balay PetscMemzero(vary,(a->mbs)*sizeof(int)); 175218c64b6SSatish Balay for ( i=0; i<ncols; i++) vary[icol[i]/bs]++; 176218c64b6SSatish Balay count = 0; 177218c64b6SSatish Balay for (i=0; i<a->mbs; i++) { 178218c64b6SSatish Balay if (vary[i]!=0 && vary[i]!=bs) SETERRA(1,"MatGetSubmatrices_SeqBAIJ:"); 179218c64b6SSatish Balay if (vary[i]==bs) iary[count++] = i; 180218c64b6SSatish Balay } 181218c64b6SSatish Balay ierr = ISCreateSeq(MPI_COMM_SELF, count, iary,&is2); CHKERRQ(ierr); 182218c64b6SSatish Balay ierr = ISRestoreIndices(isrow,&irow); CHKERRQ(ierr); 183218c64b6SSatish Balay ierr = ISRestoreIndices(iscol,&icol); CHKERRQ(ierr); 184218c64b6SSatish Balay PetscFree(vary); 185218c64b6SSatish Balay 186218c64b6SSatish Balay ierr = MatGetSubMatrix_SeqBAIJ_Private(A,is1,is2,scall,B); CHKERRQ(ierr); 187218c64b6SSatish Balay ISDestroy(is1); 188218c64b6SSatish Balay ISDestroy(is2); 189218c64b6SSatish Balay return 0; 190218c64b6SSatish Balay } 191218c64b6SSatish Balay 192905e6a2fSBarry Smith extern int MatGetSubMatrix_SeqBAIJ(Mat,IS,IS,MatGetSubMatrixCall,Mat*); 193905e6a2fSBarry Smith 194736121d4SSatish Balay int MatGetSubMatrices_SeqBAIJ(Mat A,int n, IS *irow,IS *icol,MatGetSubMatrixCall scall, 195736121d4SSatish Balay Mat **B) 196736121d4SSatish Balay { 197736121d4SSatish Balay int ierr,i; 198736121d4SSatish Balay 199736121d4SSatish Balay if (scall == MAT_INITIAL_MATRIX) { 200736121d4SSatish Balay *B = (Mat *) PetscMalloc( (n+1)*sizeof(Mat) ); CHKPTRQ(*B); 201736121d4SSatish Balay } 202736121d4SSatish Balay 203736121d4SSatish Balay for ( i=0; i<n; i++ ) { 204905e6a2fSBarry Smith ierr = MatGetSubMatrix_SeqBAIJ(A,irow[i],icol[i],scall,&(*B)[i]);CHKERRQ(ierr); 205736121d4SSatish Balay } 206736121d4SSatish Balay return 0; 207736121d4SSatish Balay } 208218c64b6SSatish Balay 209218c64b6SSatish Balay 210218c64b6SSatish Balay 211218c64b6SSatish Balay 212218c64b6SSatish Balay 213218c64b6SSatish Balay 214218c64b6SSatish Balay 215