1 2 3 #include "aij.h" 4 #include "inline/spops.h" 5 /* 6 Factorization code for AIJ format. 7 */ 8 9 int MatiAIJLUFactorSymbolic(Mat mat,IS isrow,IS iscol,Mat *fact) 10 { 11 Matiaij *aij = (Matiaij *) mat->data, *aijnew; 12 IS isicol; 13 int *r,*ic, ierr, i, j, n = aij->m, *ai = aij->i, *aj = aij->j; 14 int prow, *ainew,*ajnew, jmax,*fill, *ajtmp, nz , *ii; 15 int *idnew, idx, pivot_row,row,m,fm, nnz, nzi,len; 16 17 if (n != aij->n) SETERR(1,"Mat must be square"); 18 if (!isrow) {SETERR(1,"Must have row permutation");} 19 if (!iscol) {SETERR(1,"Must have column permutation");} 20 21 if (ierr = ISInvertPermutation(iscol,&isicol)) SETERR(ierr,0); 22 ISGetIndices(isrow,&r); ISGetIndices(isicol,&ic); 23 24 /* get new row pointers */ 25 ainew = (int *) MALLOC( (n+1)*sizeof(int) ); CHKPTR(ainew); 26 ainew[0] = 1; 27 /* don't know how many column pointers are needed so estimate */ 28 jmax = 2*ai[n]; 29 ajnew = (int *) MALLOC( (jmax)*sizeof(int) ); CHKPTR(ajnew); 30 /* fill is a linked list of nonzeros in active row */ 31 fill = (int *) MALLOC( (n+1)*sizeof(int)); CHKPTR(fill); 32 /* idnew is location of diagonal in factor */ 33 idnew = (int *) MALLOC( (n+1)*sizeof(int)); CHKPTR(idnew); 34 idnew[0] = 1; 35 36 for ( i=0; i<n; i++ ) { 37 /* first copy previous fill into linked list */ 38 nnz = nz = ai[r[i]+1] - ai[r[i]]; 39 ajtmp = aj + ai[r[i]] - 1; 40 fill[n] = n; 41 while (nz--) { 42 fm = n; 43 idx = ic[*ajtmp++ - 1]; 44 do { 45 m = fm; 46 fm = fill[m]; 47 } while (fm < idx); 48 fill[m] = idx; 49 fill[idx] = fm; 50 } 51 row = fill[n]; 52 while ( row < i ) { 53 ajtmp = ajnew + idnew[row] - 1; 54 nz = ainew[row+1] - idnew[row]; 55 fm = row; 56 while (nz--) { 57 fm = n; 58 idx = *ajtmp++ - 1; 59 do { 60 m = fm; 61 fm = fill[m]; 62 } while (fm < idx); 63 if (fm != idx) { 64 fill[m] = idx; 65 fill[idx] = fm; 66 fm = idx; 67 nnz++; 68 } 69 } 70 row = fill[row]; 71 } 72 /* copy new filled row into permanent storage */ 73 ainew[i+1] = ainew[i] + nnz; 74 if (ainew[i+1] > jmax+1) { 75 /* allocate a longer ajnew */ 76 jmax += nnz*(n-i); 77 ajtmp = (int *) MALLOC( jmax*sizeof(int) );CHKPTR(ajtmp); 78 MEMCPY(ajtmp,ajnew,(ainew[i]-1)*sizeof(int)); 79 FREE(ajnew); 80 ajnew = ajtmp; 81 } 82 ajtmp = ajnew + ainew[i] - 1; 83 fm = fill[n]; 84 nzi = 0; 85 while (nnz--) { 86 if (fm < i) nzi++; 87 *ajtmp++ = fm + 1; 88 fm = fill[fm]; 89 } 90 idnew[i] = ainew[i] + nzi; 91 } 92 93 ISDestroy(isicol); FREE(fill); 94 95 /* put together the new matrix */ 96 ierr = MatCreateSequentialAIJ(n, n, 0, 0, fact); CHKERR(ierr); 97 aijnew = (Matiaij *) (*fact)->data; 98 FREE(aijnew->imax); 99 aijnew->singlemalloc = 0; 100 len = (ainew[n] - 1)*sizeof(Scalar); 101 /* the next line frees the default space generated by the Create() */ 102 FREE(aijnew->a); FREE(aijnew->ilen); 103 aijnew->a = (Scalar *) MALLOC( len ); CHKPTR(aijnew->a); 104 aijnew->j = ajnew; 105 aijnew->i = ainew; 106 aijnew->diag = idnew; 107 aijnew->ilen = 0; 108 aijnew->imax = 0; 109 (*fact)->row = isrow; 110 (*fact)->col = iscol; 111 (*fact)->factor = FACTOR_LU; 112 return 0; 113 } 114 115 int MatiAIJLUFactorNumeric(Mat mat,Mat *infact) 116 { 117 Mat fact = *infact; 118 Matiaij *aij = (Matiaij *) mat->data, *aijnew = (Matiaij *)fact->data; 119 IS iscol = fact->col, isrow = fact->row, isicol; 120 int *r,*ic, ierr, i, j, n = aij->m, *ai = aijnew->i, *aj = aijnew->j; 121 int prow, *ainew,*ajnew, jmax,*fill, *ajtmpold, *ajtmp, nz , *ii; 122 int *idnew, idx, pivot_row,row,*pj, m,fm, nnz, nzi,len; 123 Scalar *rtmp,*vnew,*v, *pv, *pc, multiplier; 124 125 if (ierr = ISInvertPermutation(iscol,&isicol)) SETERR(ierr,0); 126 ierr = ISGetIndices(isrow,&r); CHKERR(ierr); 127 ierr = ISGetIndices(isicol,&ic); CHKERR(ierr); 128 rtmp = (Scalar *) MALLOC( (n+1)*sizeof(Scalar) ); CHKPTR(rtmp); 129 130 for ( i=0; i<n; i++ ) { 131 nz = ai[i+1] - ai[i]; 132 ajtmp = aj + ai[i] - 1; 133 for ( j=0; j<nz; j++ ) rtmp[ajtmp[j]-1] = 0.0; 134 135 /* load in initial (unfactored row) */ 136 nz = aij->i[r[i]+1] - aij->i[r[i]]; 137 ajtmpold = aij->j + aij->i[r[i]] - 1; 138 v = aij->a + aij->i[r[i]] - 1; 139 for ( j=0; j<nz; j++ ) rtmp[ic[ajtmpold[j]-1]] = v[j]; 140 141 row = *ajtmp++ - 1; 142 while (row < i) { 143 pc = rtmp + row; 144 if (*pc != 0.0) { 145 nz = aijnew->diag[row] - ai[row]; 146 pv = aijnew->a + aijnew->diag[row] - 1; 147 pj = aijnew->j + aijnew->diag[row]; 148 multiplier = *pc * *pv++; 149 *pc = multiplier; 150 nz = ai[row+1] - ai[row] - 1 - nz; 151 while (nz-->0) rtmp[*pj++ - 1] -= multiplier* *pv++; 152 } 153 row = *ajtmp++ - 1; 154 } 155 /* finished row so stick it into aijnew->a */ 156 pv = aijnew->a + ai[i] - 1; 157 pj = aijnew->j + ai[i] - 1; 158 nz = ai[i+1] - ai[i]; 159 rtmp[i] = 1.0/rtmp[i]; 160 for ( j=0; j<nz; j++ ) {pv[j] = rtmp[pj[j]-1];} 161 } 162 FREE(rtmp); 163 ierr = ISRestoreIndices(isicol,&ic); CHKERR(ierr); 164 ierr = ISRestoreIndices(isrow,&r); CHKERR(ierr); 165 ierr = ISDestroy(isicol); CHKERR(ierr); 166 fact->factor = FACTOR_LU; 167 168 return 0; 169 } 170 int MatiAIJLUFactor(Mat matin,IS row,IS col) 171 { 172 Matiaij *mat = (Matiaij *) matin->data; 173 int ierr, info; 174 Mat fact; 175 ierr = MatiAIJLUFactorSymbolic(matin,row,col,&fact); CHKERR(ierr); 176 ierr = MatiAIJLUFactorNumeric(matin,&fact); CHKERR(ierr); 177 178 /* free all the data structures from mat */ 179 FREE(mat->a); 180 if (!mat->singlemalloc) {FREE(mat->i); FREE(mat->j);} 181 if (mat->diag) FREE(mat->diag); 182 if (mat->ilen) FREE(mat->ilen); 183 if (mat->imax) FREE(mat->imax); 184 if (matin->row && matin->col && matin->row != matin->col) { 185 ISDestroy(matin->row); 186 } 187 if (matin->col) ISDestroy(matin->col); 188 FREE(mat); 189 190 MEMCPY(matin,fact,sizeof(struct _Mat)); 191 FREE(fact); 192 return 0; 193 } 194 195 int MatiAIJSolve(Mat mat,Vec bb, Vec xx) 196 { 197 Matiaij *aij = (Matiaij *) mat->data; 198 IS iscol = mat->col, isrow = mat->row; 199 int *r,*c, ierr, i, j, n = aij->m, *vi, *ai = aij->i, *aj = aij->j; 200 int nz; 201 Scalar *x,*b,*tmp, *aa = aij->a, sum, *v; 202 203 if (ierr = VecGetArray(bb,&b)) SETERR(ierr,0); 204 if (ierr = VecGetArray(xx,&x)) SETERR(ierr,0); 205 tmp = (Scalar *) MALLOC(n*sizeof(Scalar)); CHKPTR(tmp); 206 207 if (ierr = ISGetIndices(isrow,&r)) SETERR(ierr,0); 208 if (ierr = ISGetIndices(iscol,&c)) SETERR(ierr,0); c = c + (n-1); 209 210 /* forward solve the lower triangular */ 211 tmp[0] = b[*r++]; 212 for ( i=1; i<n; i++ ) { 213 v = aa + ai[i] - 1; 214 vi = aj + ai[i] - 1; 215 nz = aij->diag[i] - ai[i]; 216 sum = b[*r++]; 217 while (nz--) sum -= *v++ * tmp[*vi++ - 1]; 218 tmp[i] = sum; 219 } 220 221 /* backward solve the upper triangular */ 222 for ( i=n-1; i>=0; i-- ){ 223 v = aa + aij->diag[i]; 224 vi = aj + aij->diag[i]; 225 nz = ai[i+1] - aij->diag[i] - 1; 226 sum = tmp[i]; 227 while (nz--) sum -= *v++ * tmp[*vi++ - 1]; 228 x[*c--] = tmp[i] = sum*aa[aij->diag[i]-1]; 229 } 230 231 FREE(tmp); 232 return 0; 233 } 234 int MatiAIJSolveAdd(Mat mat,Vec bb, Vec yy, Vec xx) 235 { 236 Matiaij *aij = (Matiaij *) mat->data; 237 IS iscol = mat->col, isrow = mat->row; 238 int *r,*c, ierr, i, j, n = aij->m, *vi, *ai = aij->i, *aj = aij->j; 239 int nz; 240 Scalar *x,*b,*tmp, *aa = aij->a, sum, *v; 241 242 if (yy != xx) {ierr = VecCopy(yy,xx); CHKERR(ierr);} 243 244 if (ierr = VecGetArray(bb,&b)) SETERR(ierr,0); 245 if (ierr = VecGetArray(xx,&x)) SETERR(ierr,0); 246 tmp = (Scalar *) MALLOC(n*sizeof(Scalar)); CHKPTR(tmp); 247 248 if (ierr = ISGetIndices(isrow,&r)) SETERR(ierr,0); 249 if (ierr = ISGetIndices(iscol,&c)) SETERR(ierr,0); c = c + (n-1); 250 251 /* forward solve the lower triangular */ 252 tmp[0] = b[*r++]; 253 for ( i=1; i<n; i++ ) { 254 v = aa + ai[i] - 1; 255 vi = aj + ai[i] - 1; 256 nz = aij->diag[i] - ai[i]; 257 sum = b[*r++]; 258 while (nz--) sum -= *v++ * tmp[*vi++ - 1]; 259 tmp[i] = sum; 260 } 261 262 /* backward solve the upper triangular */ 263 for ( i=n-1; i>=0; i-- ){ 264 v = aa + aij->diag[i]; 265 vi = aj + aij->diag[i]; 266 nz = ai[i+1] - aij->diag[i] - 1; 267 sum = tmp[i]; 268 while (nz--) sum -= *v++ * tmp[*vi++ - 1]; 269 tmp[i] = sum*aa[aij->diag[i]-1]; 270 x[*c--] += tmp[i]; 271 } 272 273 FREE(tmp); 274 return 0; 275 } 276 /* -------------------------------------------------------------------*/ 277 int MatiAIJSolveTrans(Mat mat,Vec bb, Vec xx) 278 { 279 Matiaij *aij = (Matiaij *) mat->data; 280 IS iscol = mat->col, isrow = mat->row, invisrow,inviscol; 281 int *r,*c, ierr, i, j, n = aij->m, *vi, *ai = aij->i, *aj = aij->j; 282 int nz; 283 Scalar *x,*b,*tmp, *aa = aij->a, sum, *v; 284 285 if (ierr = VecGetArray(bb,&b)) SETERR(ierr,0); 286 if (ierr = VecGetArray(xx,&x)) SETERR(ierr,0); 287 tmp = (Scalar *) MALLOC(n*sizeof(Scalar)); CHKPTR(tmp); 288 289 /* invert the permutations */ 290 ierr = ISInvertPermutation(isrow,&invisrow); CHKERR(ierr); 291 ierr = ISInvertPermutation(iscol,&inviscol); CHKERR(ierr); 292 293 294 if (ierr = ISGetIndices(invisrow,&r)) SETERR(ierr,0); 295 if (ierr = ISGetIndices(inviscol,&c)) SETERR(ierr,0); 296 297 /* copy the b into temp work space according to permutation */ 298 for ( i=0; i<n; i++ ) tmp[c[i]] = b[i]; 299 300 /* forward solve the U^T */ 301 for ( i=0; i<n; i++ ) { 302 v = aa + aij->diag[i] - 1; 303 vi = aj + aij->diag[i]; 304 nz = ai[i+1] - aij->diag[i] - 1; 305 tmp[i] *= *v++; 306 while (nz--) { 307 tmp[*vi++ - 1] -= (*v++)*tmp[i]; 308 } 309 } 310 311 /* backward solve the L^T */ 312 for ( i=n-1; i>=0; i-- ){ 313 v = aa + aij->diag[i] - 2; 314 vi = aj + aij->diag[i] - 2; 315 nz = aij->diag[i] - ai[i]; 316 while (nz--) { 317 tmp[*vi-- - 1] -= (*v--)*tmp[i]; 318 } 319 } 320 321 /* copy tmp into x according to permutation */ 322 for ( i=0; i<n; i++ ) x[r[i]] = tmp[i]; 323 324 ISDestroy(invisrow); ISDestroy(inviscol); 325 326 FREE(tmp); 327 return 0; 328 } 329 330 int MatiAIJSolveTransAdd(Mat mat,Vec bb, Vec xx,Vec zz) 331 { 332 Matiaij *aij = (Matiaij *) mat->data; 333 } 334