1*33cda0aeSHong Zhang /*$Id: sro.c,v 1.16 2000/09/20 14:52:19 bsmith Exp hzhang $*/ 2336c05bdSSatish Balay 349b5e25fSSatish Balay #include "petscsys.h" 449b5e25fSSatish Balay #include "src/mat/impls/baij/seq/baij.h" 549b5e25fSSatish Balay #include "src/vec/vecimpl.h" 649b5e25fSSatish Balay #include "src/inline/spops.h" 749b5e25fSSatish Balay #include "sbaij.h" 849b5e25fSSatish Balay 949b5e25fSSatish Balay /* 10392d98d6SHong Zhang This function is used before applying a 11392d98d6SHong Zhang symmetric reordering to matrix A that is 12392d98d6SHong Zhang in SBAIJ format. 13392d98d6SHong Zhang 14392d98d6SHong Zhang The permutation is assumed to be symmetric, i.e., 15392d98d6SHong Zhang P = P^T (= inv(P)), 16392d98d6SHong Zhang so the permuted matrix P*A*inv(P)=P*A*P^T is ensured to be symmetric. 17392d98d6SHong Zhang 18392d98d6SHong Zhang The function is modified from sro.f of YSMP. The description from YSMP: 19392d98d6SHong Zhang C THE NONZERO ENTRIES OF THE MATRIX M ARE ASSUMED TO BE STORED 20392d98d6SHong Zhang C SYMMETRICALLY IN (IA,JA,A) FORMAT (I.E., NOT BOTH M(I,J) AND M(J,I) 21392d98d6SHong Zhang C ARE STORED IF I NE J). 22392d98d6SHong Zhang C 23392d98d6SHong Zhang C SRO DOES NOT REARRANGE THE ORDER OF THE ROWS, BUT DOES MOVE 24392d98d6SHong Zhang C NONZEROES FROM ONE ROW TO ANOTHER TO ENSURE THAT IF M(I,J) WILL BE 25392d98d6SHong Zhang C IN THE UPPER TRIANGLE OF M WITH RESPECT TO THE NEW ORDERING, THEN 26392d98d6SHong Zhang C M(I,J) IS STORED IN ROW I (AND THUS M(J,I) IS NOT STORED); WHEREAS 27392d98d6SHong Zhang C IF M(I,J) WILL BE IN THE STRICT LOWER TRIANGLE OF M, THEN M(J,I) IS 28392d98d6SHong Zhang C STORED IN ROW J (AND THUS M(I,J) IS NOT STORED). 29392d98d6SHong Zhang 3049a6740bSHong Zhang 3149a6740bSHong Zhang -- output: new index set (ai, aj, a) for A such that all 32392d98d6SHong Zhang nonzero A_(p(i),isp(k)) will be stored in the upper triangle. 33392d98d6SHong Zhang Note: matrix A is not permuted by this function! 3449b5e25fSSatish Balay */ 3549b5e25fSSatish Balay #undef __FUNC__ 369ce2e32cSSatish Balay #define __FUNC__ "MatReorderingSeqSBAIJ" 3795910c0aSHong Zhang int MatReorderingSeqSBAIJ(Mat A,IS perm) 3849b5e25fSSatish Balay { 3949b5e25fSSatish Balay Mat_SeqSBAIJ *a=(Mat_SeqSBAIJ *)A->data; 40434e015dSHong Zhang int *r,ierr,i,mbs=a->mbs,*rip,*riip; 41f1ab1b7aSHong Zhang int *ai,*aj; 42f1ab1b7aSHong Zhang int *nzr,nz,jmin,jmax,j,k,ajk,len; 4395910c0aSHong Zhang IS iperm; /* inverse of perm */ 4449b5e25fSSatish Balay 4549b5e25fSSatish Balay PetscFunctionBegin; 4649b5e25fSSatish Balay if (!mbs) PetscFunctionReturn(0); 4795910c0aSHong Zhang ierr = ISGetIndices(perm,&rip);CHKERRQ(ierr); 4895910c0aSHong Zhang ierr = ISInvertPermutation(perm,PETSC_DECIDE,&iperm);CHKERRQ(ierr); 4995910c0aSHong Zhang ierr = ISGetIndices(iperm,&riip);CHKERRQ(ierr); 5049b5e25fSSatish Balay 5149b5e25fSSatish Balay for (i=0; i<mbs; i++) { 52392d98d6SHong Zhang if (rip[i] - riip[i] != 0) SETERRQ(1,1,"Non-symm. permutation, use symm. permutation or general matrix format"); 5349b5e25fSSatish Balay } 5495910c0aSHong Zhang ierr = ISRestoreIndices(iperm,&riip);CHKERRA(ierr); 5595910c0aSHong Zhang ierr = ISDestroy(iperm);CHKERRA(ierr); 5695910c0aSHong Zhang 57*33cda0aeSHong Zhang if (!a->inew){ 58f1ab1b7aSHong Zhang len = (mbs+1 + 2*(a->i[mbs]))*sizeof(int); 59f1ab1b7aSHong Zhang ai = (int*)PetscMalloc(len); CHKPTRQ(ai); 60f1ab1b7aSHong Zhang aj = ai + mbs+1; 61*33cda0aeSHong Zhang } else { 62*33cda0aeSHong Zhang ai = a->inew; aj = a->jnew; 63*33cda0aeSHong Zhang } 64434e015dSHong Zhang ierr = PetscMemcpy(ai,a->i,(mbs+1)*sizeof(int));CHKERRQ(ierr); 65434e015dSHong Zhang ierr = PetscMemcpy(aj,a->j,(a->i[mbs])*sizeof(int));CHKERRQ(ierr); 66*33cda0aeSHong Zhang 67434e015dSHong Zhang /* 68434e015dSHong Zhang Phase 1: Find row index r in which to store each nonzero. 69434e015dSHong Zhang Initialize count of nonzeros to be stored in each row (nzr). 70434e015dSHong Zhang At the end of this phase, a nonzero a(*,*)=a(r(),aj()) 71434e015dSHong Zhang s.t. a(perm(r),perm(aj)) will fall into upper triangle part. 72434e015dSHong Zhang */ 7349b5e25fSSatish Balay 7449b5e25fSSatish Balay nzr = (int*)PetscMalloc(mbs*sizeof(int));CHKPTRQ(nzr); 7549b5e25fSSatish Balay r = (int*)PetscMalloc(ai[mbs]*sizeof(int));CHKPTRQ(r); 7649b5e25fSSatish Balay for (i=0; i<mbs; i++) nzr[i] = 0; 7749b5e25fSSatish Balay for (i=0; i<ai[mbs]; i++) r[i] = 0; 7849b5e25fSSatish Balay 7949b5e25fSSatish Balay /* for each nonzero element */ 8049b5e25fSSatish Balay for (i=0; i<mbs; i++){ 8149b5e25fSSatish Balay nz = ai[i+1] - ai[i]; 8249b5e25fSSatish Balay j = ai[i]; 8395910c0aSHong Zhang /* printf("nz = %d, j=%d\n",nz,j); */ 8449b5e25fSSatish Balay while (nz--){ 8549b5e25fSSatish Balay /* --- find row (=r[j]) and column (=aj[j]) in which to store a[j] ...*/ 86434e015dSHong Zhang k = aj[j]; /* col. index */ 8795910c0aSHong Zhang /* printf("nz = %d, k=%d\n", nz,k); */ 88434e015dSHong Zhang /* for entry that will be permuted into lower triangle, swap row and col. index */ 8949b5e25fSSatish Balay if (rip[k] < rip[i]) aj[j] = i; 9049b5e25fSSatish Balay else k = i; 9195910c0aSHong Zhang 9249b5e25fSSatish Balay r[j] = k; j++; 9349b5e25fSSatish Balay nzr[k] ++; /* increment count of nonzeros in that row */ 9449b5e25fSSatish Balay } 9549b5e25fSSatish Balay } 9649b5e25fSSatish Balay 97434e015dSHong Zhang /* Phase 2: Find new ai and permutation to apply to (aj,a). 98434e015dSHong Zhang Determine pointers (r) to delimit rows in permuted (aj,a). 99434e015dSHong Zhang Note: r is different from r used in phase 1. 100434e015dSHong Zhang At the end of this phase, (aj[j],a[j]) will be stored in 101434e015dSHong Zhang (aj[r(j)],a[r(j)]). 102434e015dSHong Zhang */ 10349b5e25fSSatish Balay for (i=0; i<mbs; i++){ 10449b5e25fSSatish Balay ai[i+1] = ai[i] + nzr[i]; 10549b5e25fSSatish Balay nzr[i] = ai[i+1]; 10649b5e25fSSatish Balay } 10749b5e25fSSatish Balay 108434e015dSHong Zhang /* determine where each (aj[j], a[j]) is stored in new (aj,a) 10949b5e25fSSatish Balay for each nonzero element (in reverse order) */ 11049b5e25fSSatish Balay jmin = ai[0]; jmax = ai[mbs]; 11149b5e25fSSatish Balay nz = jmax - jmin; 11249b5e25fSSatish Balay j = jmax-1; 11349b5e25fSSatish Balay while (nz--){ 11449b5e25fSSatish Balay i = r[j]; /* row value */ 11549b5e25fSSatish Balay if (aj[j] == i) r[j] = ai[i]; /* put diagonal nonzero at beginning of row */ 11649b5e25fSSatish Balay else { /* put off-diagonal nonzero in last unused location in row */ 11749b5e25fSSatish Balay nzr[i]--; r[j] = nzr[i]; 11849b5e25fSSatish Balay } 11949b5e25fSSatish Balay j--; 12049b5e25fSSatish Balay } 121*33cda0aeSHong Zhang 122f1ab1b7aSHong Zhang a->a2anew = aj + ai[mbs]; 123f1ab1b7aSHong Zhang ierr = PetscMemcpy(a->a2anew,r,ai[mbs]*sizeof(int));CHKERRQ(ierr); 12449b5e25fSSatish Balay 12549b5e25fSSatish Balay /* Phase 3: permute (aj,a) to upper triangular form (wrt new ordering) */ 12649b5e25fSSatish Balay for (j=jmin; j<jmax; j++){ 12749b5e25fSSatish Balay while (r[j] != j){ 12849b5e25fSSatish Balay k = r[j]; r[j] = r[k]; r[k] = k; 12949b5e25fSSatish Balay ajk = aj[k]; aj[k] = aj[j]; aj[j] = ajk; 130434e015dSHong Zhang /* ak = aa[k]; aa[k] = aa[j]; aa[j] = ak; */ 13149b5e25fSSatish Balay } 13249b5e25fSSatish Balay } 133507de105SBarry Smith ierr= ISRestoreIndices(perm,&rip);CHKERRA(ierr); 13449b5e25fSSatish Balay 135f1ab1b7aSHong Zhang a->inew = ai; 136f1ab1b7aSHong Zhang a->jnew = aj; 137f1ab1b7aSHong Zhang 1388331a44cSBarry Smith if (a->row) { 1398331a44cSBarry Smith ierr = ISDestroy(a->row);CHKERRQ(ierr); 1408331a44cSBarry Smith } 1418331a44cSBarry Smith if (a->icol) { 1428331a44cSBarry Smith ierr = ISDestroy(a->icol);CHKERRQ(ierr); 1438331a44cSBarry Smith } 14495910c0aSHong Zhang a->row = perm; 14595910c0aSHong Zhang a->icol = perm; 14695910c0aSHong Zhang ierr = PetscObjectReference((PetscObject)perm);CHKERRQ(ierr); 14795910c0aSHong Zhang ierr = PetscObjectReference((PetscObject)perm);CHKERRQ(ierr); 14849b5e25fSSatish Balay 14995910c0aSHong Zhang ierr = PetscFree(nzr);CHKERRA(ierr); 150f1ab1b7aSHong Zhang ierr = PetscFree(r);CHKERRA(ierr); 15195910c0aSHong Zhang 15249b5e25fSSatish Balay PetscFunctionReturn(0); 15349b5e25fSSatish Balay } 15449b5e25fSSatish Balay 155f1ab1b7aSHong Zhang 156