xref: /petsc/src/mat/impls/sbaij/seq/sro.c (revision 7c4f633dc6bb6149cca88d301ead35a99e103cbb)
1be1d678aSKris Buschelman #define PETSCMAT_DLL
2336c05bdSSatish Balay 
3*7c4f633dSBarry Smith #include "../src/mat/impls/baij/seq/baij.h"
4*7c4f633dSBarry Smith #include "../src/inline/spops.h"
5*7c4f633dSBarry Smith #include "../src/mat/impls/sbaij/seq/sbaij.h"
6325e03aeSBarry Smith #include "petscsys.h"
749b5e25fSSatish Balay 
849b5e25fSSatish Balay /*
9392d98d6SHong Zhang This function is used before applying a
10392d98d6SHong Zhang symmetric reordering to matrix A that is
11392d98d6SHong Zhang in SBAIJ format.
12392d98d6SHong Zhang 
13392d98d6SHong Zhang The permutation is assumed to be symmetric, i.e.,
14392d98d6SHong Zhang P = P^T (= inv(P)),
15392d98d6SHong Zhang so the permuted matrix P*A*inv(P)=P*A*P^T is ensured to be symmetric.
16d33dd558SHong Zhang  - a wrong assumption! This code needs rework!  -- Hong
17392d98d6SHong Zhang 
18392d98d6SHong Zhang The function is modified from sro.f of YSMP. The description from YSMP:
19392d98d6SHong Zhang C    THE NONZERO ENTRIES OF THE MATRIX M ARE ASSUMED TO BE STORED
20392d98d6SHong Zhang C    SYMMETRICALLY IN (IA,JA,A) FORMAT (I.E., NOT BOTH M(I,J) AND M(J,I)
21392d98d6SHong Zhang C    ARE STORED IF I NE J).
22392d98d6SHong Zhang C
23392d98d6SHong Zhang C    SRO DOES NOT REARRANGE THE ORDER OF THE ROWS, BUT DOES MOVE
24392d98d6SHong Zhang C    NONZEROES FROM ONE ROW TO ANOTHER TO ENSURE THAT IF M(I,J) WILL BE
25392d98d6SHong Zhang C    IN THE UPPER TRIANGLE OF M WITH RESPECT TO THE NEW ORDERING, THEN
26392d98d6SHong Zhang C    M(I,J) IS STORED IN ROW I (AND THUS M(J,I) IS NOT STORED);  WHEREAS
27392d98d6SHong Zhang C    IF M(I,J) WILL BE IN THE STRICT LOWER TRIANGLE OF M, THEN M(J,I) IS
28392d98d6SHong Zhang C    STORED IN ROW J (AND THUS M(I,J) IS NOT STORED).
29392d98d6SHong Zhang 
3049a6740bSHong Zhang 
318dd41b81SHong Zhang   -- output: new index set (inew, jnew) for A and a map a2anew that maps
328dd41b81SHong Zhang              values a to anew, such that all
338dd41b81SHong Zhang              nonzero A_(perm(i),iperm(k)) will be stored in the upper triangle.
34392d98d6SHong Zhang              Note: matrix A is not permuted by this function!
3549b5e25fSSatish Balay */
364a2ae208SSatish Balay #undef __FUNCT__
374a2ae208SSatish Balay #define __FUNCT__ "MatReorderingSeqSBAIJ"
38be1d678aSKris Buschelman PetscErrorCode PETSCMAT_DLLEXPORT MatReorderingSeqSBAIJ(Mat A,IS perm)
3949b5e25fSSatish Balay {
4049b5e25fSSatish Balay   Mat_SeqSBAIJ   *a=(Mat_SeqSBAIJ *)A->data;
416849ba73SBarry Smith   PetscErrorCode ierr;
425d0c19d7SBarry Smith   const PetscInt mbs=a->mbs,*rip,*riip;
435d0c19d7SBarry Smith   PetscInt       *ai,*aj,*r;
445d0c19d7SBarry Smith   PetscInt       *nzr,nz,jmin,jmax,j,k,ajk,len,i;
4595910c0aSHong Zhang   IS             iperm;  /* inverse of perm */
4649b5e25fSSatish Balay 
4749b5e25fSSatish Balay   PetscFunctionBegin;
4849b5e25fSSatish Balay   if (!mbs) PetscFunctionReturn(0);
49d33dd558SHong Zhang   SETERRQ(PETSC_ERR_SUP,"Matrix reordering is not supported for sbaij matrix. Use aij format");
5095910c0aSHong Zhang   ierr = ISGetIndices(perm,&rip);CHKERRQ(ierr);
51d33dd558SHong Zhang 
5295910c0aSHong Zhang   ierr = ISInvertPermutation(perm,PETSC_DECIDE,&iperm);CHKERRQ(ierr);
5395910c0aSHong Zhang   ierr = ISGetIndices(iperm,&riip);CHKERRQ(ierr);
5449b5e25fSSatish Balay 
5549b5e25fSSatish Balay   for (i=0; i<mbs; i++) {
561302d50aSBarry Smith     if (rip[i] != riip[i]) SETERRQ(PETSC_ERR_ARG_INCOMP,"Non-symmetric permutation, use symmetric permutation for symmetric matrices");
5749b5e25fSSatish Balay   }
58ac355199SBarry Smith   ierr = ISRestoreIndices(iperm,&riip);CHKERRQ(ierr);
59ac355199SBarry Smith   ierr = ISDestroy(iperm);CHKERRQ(ierr);
6095910c0aSHong Zhang 
6133cda0aeSHong Zhang   if (!a->inew){
6213f74950SBarry Smith     len  = (mbs+1 + 2*(a->i[mbs]))*sizeof(PetscInt);
6382502324SSatish Balay     ierr = PetscMalloc(len,&ai);CHKERRQ(ierr);
64f1ab1b7aSHong Zhang     aj   = ai + mbs+1;
6533cda0aeSHong Zhang   } else {
6633cda0aeSHong Zhang     ai = a->inew; aj = a->jnew;
6733cda0aeSHong Zhang   }
6813f74950SBarry Smith   ierr  = PetscMemcpy(ai,a->i,(mbs+1)*sizeof(PetscInt));CHKERRQ(ierr);
6913f74950SBarry Smith   ierr  = PetscMemcpy(aj,a->j,(a->i[mbs])*sizeof(PetscInt));CHKERRQ(ierr);
7033cda0aeSHong Zhang 
71434e015dSHong Zhang   /*
72434e015dSHong Zhang      Phase 1: Find row index r in which to store each nonzero.
73434e015dSHong Zhang 	      Initialize count of nonzeros to be stored in each row (nzr).
74434e015dSHong Zhang               At the end of this phase, a nonzero a(*,*)=a(r(),aj())
75434e015dSHong Zhang               s.t. a(perm(r),perm(aj)) will fall into upper triangle part.
76434e015dSHong Zhang   */
7749b5e25fSSatish Balay 
7813f74950SBarry Smith   ierr = PetscMalloc(mbs*sizeof(PetscInt),&nzr);CHKERRQ(ierr);
7913f74950SBarry Smith   ierr = PetscMalloc(ai[mbs]*sizeof(PetscInt),&r);CHKERRQ(ierr);
8049b5e25fSSatish Balay   for (i=0; i<mbs; i++) nzr[i] = 0;
8149b5e25fSSatish Balay   for (i=0; i<ai[mbs]; i++) r[i] = 0;
8249b5e25fSSatish Balay 
8349b5e25fSSatish Balay   /*  for each nonzero element */
8449b5e25fSSatish Balay   for (i=0; i<mbs; i++){
8549b5e25fSSatish Balay     nz = ai[i+1] - ai[i];
8649b5e25fSSatish Balay     j = ai[i];
8795910c0aSHong Zhang     /* printf("nz = %d, j=%d\n",nz,j); */
8849b5e25fSSatish Balay     while (nz--){
8949b5e25fSSatish Balay       /*  --- find row (=r[j]) and column (=aj[j]) in which to store a[j] ...*/
90434e015dSHong Zhang       k = aj[j];                          /* col. index */
9195910c0aSHong Zhang       /* printf("nz = %d, k=%d\n", nz,k); */
92434e015dSHong Zhang       /* for entry that will be permuted into lower triangle, swap row and col. index */
9349b5e25fSSatish Balay       if (rip[k] < rip[i]) aj[j] = i;
9449b5e25fSSatish Balay       else k = i;
9595910c0aSHong Zhang 
9649b5e25fSSatish Balay       r[j] = k; j++;
9749b5e25fSSatish Balay       nzr[k] ++; /* increment count of nonzeros in that row */
9849b5e25fSSatish Balay     }
9949b5e25fSSatish Balay   }
10049b5e25fSSatish Balay 
101434e015dSHong Zhang   /* Phase 2: Find new ai and permutation to apply to (aj,a).
102434e015dSHong Zhang               Determine pointers (r) to delimit rows in permuted (aj,a).
103434e015dSHong Zhang               Note: r is different from r used in phase 1.
104434e015dSHong Zhang               At the end of this phase, (aj[j],a[j]) will be stored in
105434e015dSHong Zhang               (aj[r(j)],a[r(j)]).
106434e015dSHong Zhang   */
10749b5e25fSSatish Balay     for (i=0; i<mbs; i++){
10849b5e25fSSatish Balay       ai[i+1] = ai[i] + nzr[i];
10949b5e25fSSatish Balay       nzr[i]    = ai[i+1];
11049b5e25fSSatish Balay     }
11149b5e25fSSatish Balay 
112434e015dSHong Zhang   /* determine where each (aj[j], a[j]) is stored in new (aj,a)
11349b5e25fSSatish Balay      for each nonzero element (in reverse order) */
11449b5e25fSSatish Balay   jmin = ai[0]; jmax = ai[mbs];
11549b5e25fSSatish Balay   nz = jmax - jmin;
11649b5e25fSSatish Balay   j = jmax-1;
11749b5e25fSSatish Balay   while (nz--){
11849b5e25fSSatish Balay     i = r[j];  /* row value */
11949b5e25fSSatish Balay     if (aj[j] == i) r[j] = ai[i]; /* put diagonal nonzero at beginning of row */
12049b5e25fSSatish Balay     else { /* put off-diagonal nonzero in last unused location in row */
12149b5e25fSSatish Balay       nzr[i]--; r[j] = nzr[i];
12249b5e25fSSatish Balay     }
12349b5e25fSSatish Balay     j--;
12449b5e25fSSatish Balay   }
12533cda0aeSHong Zhang 
126f1ab1b7aSHong Zhang   a->a2anew = aj + ai[mbs];
12713f74950SBarry Smith   ierr  = PetscMemcpy(a->a2anew,r,ai[mbs]*sizeof(PetscInt));CHKERRQ(ierr);
12849b5e25fSSatish Balay 
12949b5e25fSSatish Balay   /* Phase 3: permute (aj,a) to upper triangular form (wrt new ordering) */
13049b5e25fSSatish Balay   for (j=jmin; j<jmax; j++){
13149b5e25fSSatish Balay     while (r[j] != j){
13249b5e25fSSatish Balay       k = r[j]; r[j] = r[k]; r[k] = k;
13349b5e25fSSatish Balay       ajk = aj[k]; aj[k] = aj[j]; aj[j] = ajk;
134434e015dSHong Zhang       /* ak = aa[k]; aa[k] = aa[j]; aa[j] = ak; */
13549b5e25fSSatish Balay     }
13649b5e25fSSatish Balay   }
137ac355199SBarry Smith   ierr= ISRestoreIndices(perm,&rip);CHKERRQ(ierr);
13849b5e25fSSatish Balay 
139f1ab1b7aSHong Zhang   a->inew = ai;
140f1ab1b7aSHong Zhang   a->jnew = aj;
141f1ab1b7aSHong Zhang 
1428331a44cSBarry Smith   if (a->row) {
1438331a44cSBarry Smith     ierr = ISDestroy(a->row);CHKERRQ(ierr);
1448331a44cSBarry Smith   }
1458331a44cSBarry Smith   if (a->icol) {
1468331a44cSBarry Smith     ierr = ISDestroy(a->icol);CHKERRQ(ierr);
1478331a44cSBarry Smith   }
148c3122656SLisandro Dalcin   ierr = PetscObjectReference((PetscObject)perm);CHKERRQ(ierr);
149c3122656SLisandro Dalcin   if (a->row) { ierr = ISDestroy(a->row);CHKERRQ(ierr); }
15095910c0aSHong Zhang   a->row  = perm;
151c3122656SLisandro Dalcin   ierr = PetscObjectReference((PetscObject)perm);CHKERRQ(ierr);
152c3122656SLisandro Dalcin   if (a->icol) { ierr = ISDestroy(a->icol);CHKERRQ(ierr); }
15395910c0aSHong Zhang   a->icol = perm;
15449b5e25fSSatish Balay 
155ac355199SBarry Smith   ierr = PetscFree(nzr);CHKERRQ(ierr);
156ac355199SBarry Smith   ierr = PetscFree(r);CHKERRQ(ierr);
15795910c0aSHong Zhang 
15849b5e25fSSatish Balay   PetscFunctionReturn(0);
15949b5e25fSSatish Balay }
16049b5e25fSSatish Balay 
161f1ab1b7aSHong Zhang 
162