159557b74SHong Zhang /*$Id: aijsbaij.c,v 1.9 2001/08/07 03:02:55 balay Exp $*/ 259557b74SHong Zhang 359557b74SHong Zhang #include "src/mat/impls/aij/seq/aij.h" 4861ba921SHong Zhang #include "src/mat/impls/sbaij/seq/sbaij.h" 559557b74SHong Zhang 659557b74SHong Zhang EXTERN_C_BEGIN 759557b74SHong Zhang #undef __FUNCT__ 84e5e7fe4SHong Zhang #define __FUNCT__ "MatConvert_SeqSBAI_SeqAIJ" 94e5e7fe4SHong Zhang int MatConvert_SeqSBAIJ_SeqAIJ(Mat A,const MatType newtype,Mat *newmat) 104e5e7fe4SHong Zhang { 114e5e7fe4SHong Zhang Mat B; 124e5e7fe4SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 134e5e7fe4SHong Zhang Mat_SeqAIJ *b; 14*a7a3a9ebSHong Zhang int ierr,*ai=a->i,*aj=a->j,m=A->m,n=A->n,i,j,k,*bi,*bj, 15*a7a3a9ebSHong Zhang *rowlengths,nz,*rowstart,itmp; 16*a7a3a9ebSHong Zhang int bs=a->bs,bs2=bs*bs,mbs=A->m/bs; 174e5e7fe4SHong Zhang PetscScalar *av,*bv; 184e5e7fe4SHong Zhang 194e5e7fe4SHong Zhang PetscFunctionBegin; 20*a7a3a9ebSHong Zhang 214e5e7fe4SHong Zhang /* compute rowlengths of newmat */ 22*a7a3a9ebSHong Zhang ierr = PetscMalloc((2*m+1)*sizeof(int),&rowlengths);CHKERRQ(ierr); 23*a7a3a9ebSHong Zhang rowstart = rowlengths + m; 24*a7a3a9ebSHong Zhang 25*a7a3a9ebSHong Zhang for (i=0; i<mbs; i++) rowlengths[i*bs] = 0; 264e5e7fe4SHong Zhang aj = a->j; 27*a7a3a9ebSHong Zhang k = 0; 28*a7a3a9ebSHong Zhang for (i=0; i<mbs; i++) { 294e5e7fe4SHong Zhang nz = ai[i+1] - ai[i]; 30*a7a3a9ebSHong Zhang aj++; /* skip diagonal */ 31*a7a3a9ebSHong Zhang for (j=1; j<nz; j++) { /* no. of lower triangular blocks */ 32*a7a3a9ebSHong Zhang rowlengths[(*aj)*bs]++; aj++; 33*a7a3a9ebSHong Zhang } 34*a7a3a9ebSHong Zhang rowlengths[k] += nz; /* no. of upper triangular blocks */ 35*a7a3a9ebSHong Zhang rowlengths[k] *= bs; 36*a7a3a9ebSHong Zhang for (j=1; j<bs; j++) { 37*a7a3a9ebSHong Zhang rowlengths[k+j] = rowlengths[k]; 38*a7a3a9ebSHong Zhang } 39*a7a3a9ebSHong Zhang k += bs; 40*a7a3a9ebSHong Zhang /* printf(" rowlengths[%d]: %d\n",i, rowlengths[i]); */ 414e5e7fe4SHong Zhang } 424e5e7fe4SHong Zhang 43*a7a3a9ebSHong Zhang ierr = MatCreateSeqAIJ(PETSC_COMM_SELF,m,n,0,rowlengths,&B);CHKERRQ(ierr); 44*a7a3a9ebSHong Zhang ierr = MatSetOption(B,MAT_COLUMN_ORIENTED);CHKERRQ(ierr); 454e5e7fe4SHong Zhang ierr = MatSetOption(B,MAT_ROWS_SORTED);CHKERRQ(ierr); 464e5e7fe4SHong Zhang ierr = MatSetOption(B,MAT_COLUMNS_SORTED);CHKERRQ(ierr); 474e5e7fe4SHong Zhang 484e5e7fe4SHong Zhang b = (Mat_SeqAIJ*)(B->data); 494e5e7fe4SHong Zhang bi = b->i; 504e5e7fe4SHong Zhang bj = b->j; 514e5e7fe4SHong Zhang bv = b->a; 524e5e7fe4SHong Zhang 534e5e7fe4SHong Zhang /* set b->i */ 54*a7a3a9ebSHong Zhang bi[0] = 0; rowstart[0] = 0; 55*a7a3a9ebSHong Zhang for (i=0; i<mbs; i++){ 56*a7a3a9ebSHong Zhang for (j=0; j<bs; j++){ 57*a7a3a9ebSHong Zhang b->ilen[i*bs+j] = rowlengths[i*bs]; 58*a7a3a9ebSHong Zhang rowstart[i*bs+j+1] = rowstart[i*bs+j] + rowlengths[i*bs]; 594e5e7fe4SHong Zhang } 60*a7a3a9ebSHong Zhang bi[i+1] = bi[i] + rowlengths[i*bs]/bs; 61*a7a3a9ebSHong Zhang } 62*a7a3a9ebSHong Zhang if (bi[mbs] != 2*a->nz - mbs) SETERRQ2(1,"bi[mbs]: %d != 2*a->nz-mbs: %d\n",bi[mbs],2*a->nz - mbs); 634e5e7fe4SHong Zhang 644e5e7fe4SHong Zhang /* set b->j and b->a */ 654e5e7fe4SHong Zhang aj = a->j; av = a->a; 66*a7a3a9ebSHong Zhang for (i=0; i<mbs; i++) { 67*a7a3a9ebSHong Zhang /* diagonal block */ 68*a7a3a9ebSHong Zhang for (j=0; j<bs; j++){ /* row i*bs+j */ 69*a7a3a9ebSHong Zhang itmp = i*bs+j; 70*a7a3a9ebSHong Zhang for (k=0; k<bs; k++){ /* col i*bs+k */ 71*a7a3a9ebSHong Zhang *(bj + rowstart[itmp]) = (*aj)*bs+k; 72*a7a3a9ebSHong Zhang *(bv + rowstart[itmp]) = *(av+k*bs+j); 73*a7a3a9ebSHong Zhang rowstart[itmp]++; 74*a7a3a9ebSHong Zhang } 75*a7a3a9ebSHong Zhang } 76*a7a3a9ebSHong Zhang aj++; av += bs2; 77*a7a3a9ebSHong Zhang 784e5e7fe4SHong Zhang nz = ai[i+1] - ai[i] -1; 794e5e7fe4SHong Zhang while (nz--){ 80*a7a3a9ebSHong Zhang /* lower triangular blocks */ 81*a7a3a9ebSHong Zhang for (j=0; j<bs; j++){ /* row (*aj)*bs+j */ 82*a7a3a9ebSHong Zhang itmp = (*aj)*bs+j; 83*a7a3a9ebSHong Zhang for (k=0; k<bs; k++){ /* col i*bs+k */ 84*a7a3a9ebSHong Zhang *(bj + rowstart[itmp]) = i*bs+k; 85*a7a3a9ebSHong Zhang *(bv + rowstart[itmp]) = *(av+k*bs+j); 86*a7a3a9ebSHong Zhang rowstart[itmp]++; 87*a7a3a9ebSHong Zhang } 88*a7a3a9ebSHong Zhang } 89*a7a3a9ebSHong Zhang /* upper triangular blocks */ 90*a7a3a9ebSHong Zhang for (j=0; j<bs; j++){ /* row i*bs+j */ 91*a7a3a9ebSHong Zhang itmp = i*bs+j; 92*a7a3a9ebSHong Zhang for (k=0; k<bs; k++){ /* col (*aj)*bs+k */ 93*a7a3a9ebSHong Zhang *(bj + rowstart[itmp]) = (*aj)*bs+k; 94*a7a3a9ebSHong Zhang *(bv + rowstart[itmp]) = *(av+k*bs+j); 95*a7a3a9ebSHong Zhang rowstart[itmp]++; 96*a7a3a9ebSHong Zhang } 97*a7a3a9ebSHong Zhang } 98*a7a3a9ebSHong Zhang aj++; av += bs2; 994e5e7fe4SHong Zhang } 1004e5e7fe4SHong Zhang } 1014e5e7fe4SHong Zhang ierr = PetscFree(rowlengths);CHKERRQ(ierr); 1024e5e7fe4SHong Zhang ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1034e5e7fe4SHong Zhang ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1044e5e7fe4SHong Zhang 1054e5e7fe4SHong Zhang /* Fake support for "inplace" convert. */ 1064e5e7fe4SHong Zhang if (*newmat == A) { 1074e5e7fe4SHong Zhang ierr = MatDestroy(A);CHKERRQ(ierr); 1084e5e7fe4SHong Zhang } 1094e5e7fe4SHong Zhang *newmat = B; 1104e5e7fe4SHong Zhang PetscFunctionReturn(0); 1114e5e7fe4SHong Zhang } 1124e5e7fe4SHong Zhang #undef __FUNCT__ 11359557b74SHong Zhang #define __FUNCT__ "MatConvert_SeqAIJ_SeqSBAIJ" 1148e9aea5cSBarry Smith int MatConvert_SeqAIJ_SeqSBAIJ(Mat A,const MatType newtype,Mat *newmat) { 115676c34cdSKris Buschelman Mat B; 11659557b74SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 117861ba921SHong Zhang Mat_SeqSBAIJ *b; 118861ba921SHong Zhang int ierr,*ai=a->i,*aj,m=A->M,n=A->N,i,j, 1192d9a3abdSHong Zhang *bi,*bj,*rowlengths; 120861ba921SHong Zhang PetscScalar *av,*bv; 12159557b74SHong Zhang 12259557b74SHong Zhang PetscFunctionBegin; 1232d9a3abdSHong Zhang if (n != m) SETERRQ(PETSC_ERR_ARG_WRONG,"Matrix must be square"); 12459557b74SHong Zhang if (!a->diag){ 12559557b74SHong Zhang ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 12659557b74SHong Zhang } 12759557b74SHong Zhang 12859557b74SHong Zhang ierr = PetscMalloc(m*sizeof(int),&rowlengths);CHKERRQ(ierr); 12959557b74SHong Zhang for (i=0; i<m; i++) { 13059557b74SHong Zhang rowlengths[i] = ai[i+1] - a->diag[i]; 13159557b74SHong Zhang } 132676c34cdSKris Buschelman ierr = MatCreateSeqSBAIJ(PETSC_COMM_SELF,1,m,n,0,rowlengths,&B);CHKERRQ(ierr); 13359557b74SHong Zhang 134676c34cdSKris Buschelman ierr = MatSetOption(B,MAT_ROW_ORIENTED);CHKERRQ(ierr); 135676c34cdSKris Buschelman ierr = MatSetOption(B,MAT_ROWS_SORTED);CHKERRQ(ierr); 136676c34cdSKris Buschelman ierr = MatSetOption(B,MAT_COLUMNS_SORTED);CHKERRQ(ierr); 13759557b74SHong Zhang 138676c34cdSKris Buschelman b = (Mat_SeqSBAIJ*)(B->data); 139861ba921SHong Zhang bi = b->i; 140861ba921SHong Zhang bj = b->j; 141861ba921SHong Zhang bv = b->a; 142861ba921SHong Zhang 143861ba921SHong Zhang bi[0] = 0; 14459557b74SHong Zhang for (i=0; i<m; i++) { 14559557b74SHong Zhang aj = a->j + a->diag[i]; 14659557b74SHong Zhang av = a->a + a->diag[i]; 147861ba921SHong Zhang for (j=0; j<rowlengths[i]; j++){ 148861ba921SHong Zhang *bj = *aj; bj++; aj++; 149861ba921SHong Zhang *bv = *av; bv++; av++; 150861ba921SHong Zhang } 151861ba921SHong Zhang bi[i+1] = bi[i] + rowlengths[i]; 152861ba921SHong Zhang b->ilen[i] = rowlengths[i]; 15359557b74SHong Zhang } 15459557b74SHong Zhang 15559557b74SHong Zhang ierr = PetscFree(rowlengths);CHKERRQ(ierr); 156676c34cdSKris Buschelman ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 157676c34cdSKris Buschelman ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 158676c34cdSKris Buschelman 159676c34cdSKris Buschelman /* Fake support for "inplace" convert. */ 160676c34cdSKris Buschelman if (*newmat == A) { 161676c34cdSKris Buschelman ierr = MatDestroy(A);CHKERRQ(ierr); 162676c34cdSKris Buschelman } 163676c34cdSKris Buschelman *newmat = B; 164676c34cdSKris Buschelman 16559557b74SHong Zhang PetscFunctionReturn(0); 16659557b74SHong Zhang } 16759557b74SHong Zhang EXTERN_C_END 16859557b74SHong Zhang 169