xref: /petsc/src/mat/impls/baij/seq/dgefa2.c (revision c9b7c5609a4b8cd4e09bf388afdf237c5b17664b)
1be1d678aSKris Buschelman 
/*
     Inverts a 2 by 2 matrix using Gaussian elimination with partial pivoting.

       Used by the sparse factorization routines in
     src/mat/impls/baij/seq

       This is a combination of the Linpack routines
    dgefa() and dgedi() specialized for a size of 2.

       Variants of the same kernel specialized for sizes 9 and 15
    follow further down in this file.

*/
13c6db04a5SJed Brown #include <petscsys.h>
1484643e36SBarry Smith 
154a2ae208SSatish Balay #undef __FUNCT__
1696b95a6bSBarry Smith #define __FUNCT__ "PetscKernel_A_gets_inverse_A_2"
172e92ee13SHong Zhang PETSC_EXTERN PetscErrorCode PetscKernel_A_gets_inverse_A_2(MatScalar *a,PetscReal shift,PetscBool allowzeropivot,PetscBool *zeropivotdetected)
1884643e36SBarry Smith {
19690b6cddSBarry Smith   PetscInt  i__2,i__3,kp1,j,k,l,ll,i,ipvt[2],k3;
20690b6cddSBarry Smith   PetscInt  k4,j3;
21b48ee343SBarry Smith   MatScalar *aa,*ax,*ay,work[4],stmp;
22329f5518SBarry Smith   MatReal   tmp,max;
2384643e36SBarry Smith 
2484643e36SBarry Smith   PetscFunctionBegin;
25c80103daSHong Zhang   if (zeropivotdetected) *zeropivotdetected = PETSC_FALSE;
26943c8ff5SShri Abhyankar   shift = .25*shift*(1.e-12 + PetscAbsScalar(a[0]) + PetscAbsScalar(a[3]));
27*c9b7c560SHong Zhang 
2884643e36SBarry Smith   /* Parameter adjustments */
2984643e36SBarry Smith   a -= 3;
3084643e36SBarry Smith 
3184643e36SBarry Smith   k   = 1;
3284643e36SBarry Smith   kp1 = k + 1;
3384643e36SBarry Smith   k3  = 2*k;
3484643e36SBarry Smith   k4  = k3 + k;
3584643e36SBarry Smith 
36*c9b7c560SHong Zhang   /* find l = pivot index */
37ed33f8a5SSatish Balay   i__2 = 3 - k;
3884643e36SBarry Smith   aa   = &a[k4];
3984643e36SBarry Smith   max  = PetscAbsScalar(aa[0]);
4084643e36SBarry Smith   l    = 1;
4184643e36SBarry Smith   for (ll=1; ll<i__2; ll++) {
4284643e36SBarry Smith     tmp = PetscAbsScalar(aa[ll]);
4384643e36SBarry Smith     if (tmp > max) { max = tmp; l = ll+1;}
4484643e36SBarry Smith   }
4584643e36SBarry Smith   l        += k - 1;
46b48ee343SBarry Smith   ipvt[k-1] = l;
4784643e36SBarry Smith 
48943c8ff5SShri Abhyankar   if (a[l + k3] == 0.0) {
4926fbe8dcSKarl Rupp     if (shift == 0.0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %D",k-1);
5026fbe8dcSKarl Rupp     else {
51943c8ff5SShri Abhyankar       a[l + k3] = shift;
52943c8ff5SShri Abhyankar     }
53943c8ff5SShri Abhyankar   }
5484643e36SBarry Smith 
5584643e36SBarry Smith   /* interchange if necessary */
5684643e36SBarry Smith   if (l != k) {
5784643e36SBarry Smith     stmp      = a[l + k3];
5884643e36SBarry Smith     a[l + k3] = a[k4];
5984643e36SBarry Smith     a[k4]     = stmp;
6084643e36SBarry Smith   }
6184643e36SBarry Smith 
6284643e36SBarry Smith   /* compute multipliers */
6384643e36SBarry Smith   stmp = -1. / a[k4];
6484643e36SBarry Smith   i__2 = 2 - k;
6584643e36SBarry Smith   aa = &a[1 + k4];
6626fbe8dcSKarl Rupp   for (ll=0; ll<i__2; ll++) aa[ll] *= stmp;
6784643e36SBarry Smith 
6884643e36SBarry Smith   /* row elimination with column indexing */
6984643e36SBarry Smith   ax = &a[k4+1];
7084643e36SBarry Smith   for (j = kp1; j <= 2; ++j) {
7184643e36SBarry Smith     j3   = 2*j;
7284643e36SBarry Smith     stmp = a[l + j3];
7384643e36SBarry Smith     if (l != k) {
7484643e36SBarry Smith       a[l + j3] = a[k + j3];
7584643e36SBarry Smith       a[k + j3] = stmp;
7684643e36SBarry Smith     }
7784643e36SBarry Smith 
7884643e36SBarry Smith     i__3 = 2 - k;
7984643e36SBarry Smith     ay   = &a[1+k+j3];
8026fbe8dcSKarl Rupp     for (ll=0; ll<i__3; ll++) ay[ll] += stmp*ax[ll];
8184643e36SBarry Smith   }
8226fbe8dcSKarl Rupp 
83b48ee343SBarry Smith   ipvt[1] = 2;
842e92ee13SHong Zhang   if (a[6] == 0.0) {
852e92ee13SHong Zhang     PetscErrorCode ierr;
862e92ee13SHong Zhang     if (allowzeropivot) {
872e92ee13SHong Zhang       ierr = PetscInfo1(NULL,"Zero pivot, row %D\n",1);CHKERRQ(ierr);
882e92ee13SHong Zhang       *zeropivotdetected = PETSC_TRUE;
892e92ee13SHong Zhang     } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %D",1);
902e92ee13SHong Zhang   }
9184643e36SBarry Smith 
92*c9b7c560SHong Zhang   /* Now form the inverse */
9384643e36SBarry Smith   /* compute inverse(u) */
9484643e36SBarry Smith   for (k = 1; k <= 2; ++k) {
9584643e36SBarry Smith     k3    = 2*k;
9684643e36SBarry Smith     k4    = k3 + k;
9784643e36SBarry Smith     a[k4] = 1.0 / a[k4];
9884643e36SBarry Smith     stmp  = -a[k4];
9984643e36SBarry Smith     i__2  = k - 1;
10084643e36SBarry Smith     aa    = &a[k3 + 1];
10184643e36SBarry Smith     for (ll=0; ll<i__2; ll++) aa[ll] *= stmp;
10284643e36SBarry Smith     kp1 = k + 1;
10384643e36SBarry Smith     if (2 < kp1) continue;
10484643e36SBarry Smith     ax = aa;
10584643e36SBarry Smith     for (j = kp1; j <= 2; ++j) {
10684643e36SBarry Smith       j3        = 2*j;
10784643e36SBarry Smith       stmp      = a[k + j3];
10884643e36SBarry Smith       a[k + j3] = 0.0;
10984643e36SBarry Smith       ay        = &a[j3 + 1];
11026fbe8dcSKarl Rupp       for (ll=0; ll<k; ll++) ay[ll] += stmp*ax[ll];
11184643e36SBarry Smith     }
11284643e36SBarry Smith   }
11384643e36SBarry Smith 
11484643e36SBarry Smith   /* form inverse(u)*inverse(l) */
11584643e36SBarry Smith   k   = 1;
11684643e36SBarry Smith   k3  = 2*k;
11784643e36SBarry Smith   kp1 = k + 1;
11884643e36SBarry Smith   aa  = a + k3;
11984643e36SBarry Smith   for (i = kp1; i <= 2; ++i) {
120b48ee343SBarry Smith     work[i-1] = aa[i];
12184643e36SBarry Smith     aa[i]     = 0.0;
12284643e36SBarry Smith   }
12384643e36SBarry Smith   for (j = kp1; j <= 2; ++j) {
124b48ee343SBarry Smith     stmp   = work[j-1];
12584643e36SBarry Smith     ax     = &a[2*j + 1];
12684643e36SBarry Smith     ay     = &a[k3 + 1];
12784643e36SBarry Smith     ay[0] += stmp*ax[0];
12884643e36SBarry Smith     ay[1] += stmp*ax[1];
12984643e36SBarry Smith   }
130b48ee343SBarry Smith   l = ipvt[k-1];
13184643e36SBarry Smith   if (l != k) {
13284643e36SBarry Smith     ax   = &a[k3 + 1];
13384643e36SBarry Smith     ay   = &a[2*l + 1];
13484643e36SBarry Smith     stmp = ax[0]; ax[0] = ay[0]; ay[0] = stmp;
13584643e36SBarry Smith     stmp = ax[1]; ax[1] = ay[1]; ay[1] = stmp;
13684643e36SBarry Smith   }
13784643e36SBarry Smith   PetscFunctionReturn(0);
13884643e36SBarry Smith }
13984643e36SBarry Smith 
1403dfa136dSBarry Smith #undef __FUNCT__
14196b95a6bSBarry Smith #define __FUNCT__ "PetscKernel_A_gets_inverse_A_9"
1422e92ee13SHong Zhang PETSC_EXTERN PetscErrorCode PetscKernel_A_gets_inverse_A_9(MatScalar *a,PetscReal shift,PetscBool allowzeropivot,PetscBool *zeropivotdetected)
1433dfa136dSBarry Smith {
1443dfa136dSBarry Smith   PetscInt  i__2,i__3,kp1,j,k,l,ll,i,ipvt[9],kb,k3;
1453dfa136dSBarry Smith   PetscInt  k4,j3;
1463dfa136dSBarry Smith   MatScalar *aa,*ax,*ay,work[81],stmp;
1473dfa136dSBarry Smith   MatReal   tmp,max;
1483dfa136dSBarry Smith 
1493dfa136dSBarry Smith   /* gaussian elimination with partial pivoting */
1503dfa136dSBarry Smith 
1513dfa136dSBarry Smith   PetscFunctionBegin;
152c80103daSHong Zhang   if (zeropivotdetected) *zeropivotdetected = PETSC_FALSE;
153c80103daSHong Zhang 
1543dfa136dSBarry Smith   /* Parameter adjustments */
1553dfa136dSBarry Smith   a -= 10;
1563dfa136dSBarry Smith 
1573dfa136dSBarry Smith   for (k = 1; k <= 8; ++k) {
1583dfa136dSBarry Smith     kp1 = k + 1;
1593dfa136dSBarry Smith     k3  = 9*k;
1603dfa136dSBarry Smith     k4  = k3 + k;
1613dfa136dSBarry Smith     /* find l = pivot index */
1623dfa136dSBarry Smith 
163c38ccd74SBarry Smith     i__2 = 10 - k;
1643dfa136dSBarry Smith     aa   = &a[k4];
1653dfa136dSBarry Smith     max  = PetscAbsScalar(aa[0]);
1663dfa136dSBarry Smith     l    = 1;
1673dfa136dSBarry Smith     for (ll=1; ll<i__2; ll++) {
1683dfa136dSBarry Smith       tmp = PetscAbsScalar(aa[ll]);
1693dfa136dSBarry Smith       if (tmp > max) { max = tmp; l = ll+1;}
1703dfa136dSBarry Smith     }
1713dfa136dSBarry Smith     l        += k - 1;
1723dfa136dSBarry Smith     ipvt[k-1] = l;
1733dfa136dSBarry Smith 
17465e19b50SBarry Smith     if (a[l + k3] == 0.0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %D",k-1);
1753dfa136dSBarry Smith 
1763dfa136dSBarry Smith     /* interchange if necessary */
1773dfa136dSBarry Smith 
1783dfa136dSBarry Smith     if (l != k) {
1793dfa136dSBarry Smith       stmp      = a[l + k3];
1803dfa136dSBarry Smith       a[l + k3] = a[k4];
1813dfa136dSBarry Smith       a[k4]     = stmp;
1823dfa136dSBarry Smith     }
1833dfa136dSBarry Smith 
1843dfa136dSBarry Smith     /* compute multipliers */
1853dfa136dSBarry Smith 
1863dfa136dSBarry Smith     stmp = -1. / a[k4];
1873dfa136dSBarry Smith     i__2 = 9 - k;
1883dfa136dSBarry Smith     aa = &a[1 + k4];
18926fbe8dcSKarl Rupp     for (ll=0; ll<i__2; ll++) aa[ll] *= stmp;
1903dfa136dSBarry Smith 
1913dfa136dSBarry Smith     /* row elimination with column indexing */
1923dfa136dSBarry Smith 
1933dfa136dSBarry Smith     ax = &a[k4+1];
1943dfa136dSBarry Smith     for (j = kp1; j <= 9; ++j) {
1953dfa136dSBarry Smith       j3   = 9*j;
1963dfa136dSBarry Smith       stmp = a[l + j3];
1973dfa136dSBarry Smith       if (l != k) {
1983dfa136dSBarry Smith         a[l + j3] = a[k + j3];
1993dfa136dSBarry Smith         a[k + j3] = stmp;
2003dfa136dSBarry Smith       }
2013dfa136dSBarry Smith 
2023dfa136dSBarry Smith       i__3 = 9 - k;
2033dfa136dSBarry Smith       ay = &a[1+k+j3];
20426fbe8dcSKarl Rupp       for (ll=0; ll<i__3; ll++) ay[ll] += stmp*ax[ll];
2053dfa136dSBarry Smith     }
2063dfa136dSBarry Smith   }
2073dfa136dSBarry Smith   ipvt[8] = 9;
2082e92ee13SHong Zhang   if (a[90] == 0.0) {
2092e92ee13SHong Zhang     PetscErrorCode ierr;
2102e92ee13SHong Zhang     if (allowzeropivot) {
2112e92ee13SHong Zhang       ierr = PetscInfo1(NULL,"Zero pivot, row %D\n",6);CHKERRQ(ierr);
2122e92ee13SHong Zhang       *zeropivotdetected = PETSC_TRUE;
2132e92ee13SHong Zhang     } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %D",6);
2142e92ee13SHong Zhang   }
2153dfa136dSBarry Smith 
2163dfa136dSBarry Smith   /*
2173dfa136dSBarry Smith    Now form the inverse
2183dfa136dSBarry Smith   */
2193dfa136dSBarry Smith 
2203dfa136dSBarry Smith   /* compute inverse(u) */
2213dfa136dSBarry Smith 
2223dfa136dSBarry Smith   for (k = 1; k <= 9; ++k) {
2233dfa136dSBarry Smith     k3    = 9*k;
2243dfa136dSBarry Smith     k4    = k3 + k;
2253dfa136dSBarry Smith     a[k4] = 1.0 / a[k4];
2263dfa136dSBarry Smith     stmp  = -a[k4];
2273dfa136dSBarry Smith     i__2  = k - 1;
2283dfa136dSBarry Smith     aa    = &a[k3 + 1];
2293dfa136dSBarry Smith     for (ll=0; ll<i__2; ll++) aa[ll] *= stmp;
2303dfa136dSBarry Smith     kp1 = k + 1;
2313dfa136dSBarry Smith     if (9 < kp1) continue;
2323dfa136dSBarry Smith     ax = aa;
2333dfa136dSBarry Smith     for (j = kp1; j <= 9; ++j) {
2343dfa136dSBarry Smith       j3        = 9*j;
2353dfa136dSBarry Smith       stmp      = a[k + j3];
2363dfa136dSBarry Smith       a[k + j3] = 0.0;
2373dfa136dSBarry Smith       ay        = &a[j3 + 1];
23826fbe8dcSKarl Rupp       for (ll=0; ll<k; ll++) ay[ll] += stmp*ax[ll];
2393dfa136dSBarry Smith     }
2403dfa136dSBarry Smith   }
2413dfa136dSBarry Smith 
2423dfa136dSBarry Smith   /* form inverse(u)*inverse(l) */
2433dfa136dSBarry Smith 
2443dfa136dSBarry Smith   for (kb = 1; kb <= 8; ++kb) {
2453dfa136dSBarry Smith     k   = 9 - kb;
2463dfa136dSBarry Smith     k3  = 9*k;
2473dfa136dSBarry Smith     kp1 = k + 1;
2483dfa136dSBarry Smith     aa  = a + k3;
2493dfa136dSBarry Smith     for (i = kp1; i <= 9; ++i) {
2503dfa136dSBarry Smith       work[i-1] = aa[i];
2513dfa136dSBarry Smith       aa[i]     = 0.0;
2523dfa136dSBarry Smith     }
2533dfa136dSBarry Smith     for (j = kp1; j <= 9; ++j) {
2543dfa136dSBarry Smith       stmp   = work[j-1];
2553dfa136dSBarry Smith       ax     = &a[9*j + 1];
2563dfa136dSBarry Smith       ay     = &a[k3 + 1];
2573dfa136dSBarry Smith       ay[0] += stmp*ax[0];
2583dfa136dSBarry Smith       ay[1] += stmp*ax[1];
2593dfa136dSBarry Smith       ay[2] += stmp*ax[2];
2603dfa136dSBarry Smith       ay[3] += stmp*ax[3];
2613dfa136dSBarry Smith       ay[4] += stmp*ax[4];
2623dfa136dSBarry Smith       ay[5] += stmp*ax[5];
2633dfa136dSBarry Smith       ay[6] += stmp*ax[6];
2643dfa136dSBarry Smith       ay[7] += stmp*ax[7];
2653dfa136dSBarry Smith       ay[8] += stmp*ax[8];
2663dfa136dSBarry Smith     }
2673dfa136dSBarry Smith     l = ipvt[k-1];
2683dfa136dSBarry Smith     if (l != k) {
2693dfa136dSBarry Smith       ax   = &a[k3 + 1];
2703dfa136dSBarry Smith       ay   = &a[9*l + 1];
2713dfa136dSBarry Smith       stmp = ax[0]; ax[0] = ay[0]; ay[0] = stmp;
2723dfa136dSBarry Smith       stmp = ax[1]; ax[1] = ay[1]; ay[1] = stmp;
2733dfa136dSBarry Smith       stmp = ax[2]; ax[2] = ay[2]; ay[2] = stmp;
2743dfa136dSBarry Smith       stmp = ax[3]; ax[3] = ay[3]; ay[3] = stmp;
2753dfa136dSBarry Smith       stmp = ax[4]; ax[4] = ay[4]; ay[4] = stmp;
2763dfa136dSBarry Smith       stmp = ax[5]; ax[5] = ay[5]; ay[5] = stmp;
2773dfa136dSBarry Smith       stmp = ax[6]; ax[6] = ay[6]; ay[6] = stmp;
2783dfa136dSBarry Smith       stmp = ax[7]; ax[7] = ay[7]; ay[7] = stmp;
2793dfa136dSBarry Smith       stmp = ax[8]; ax[8] = ay[8]; ay[8] = stmp;
2803dfa136dSBarry Smith     }
2813dfa136dSBarry Smith   }
2823dfa136dSBarry Smith   PetscFunctionReturn(0);
2833dfa136dSBarry Smith }
28484643e36SBarry Smith 
/*
      Inverts a 15 by 15 matrix using Gaussian elimination with partial pivoting.

       Used by the sparse factorization routines in
     src/mat/impls/baij/seq

       This is a combination of the Linpack routines
    dgefa() and dgedi() specialized for a size of 15.

*/
29529a97285SShri Abhyankar 
29629a97285SShri Abhyankar #undef __FUNCT__
29796b95a6bSBarry Smith #define __FUNCT__ "PetscKernel_A_gets_inverse_A_15"
298922032d7SHong Zhang PETSC_EXTERN PetscErrorCode PetscKernel_A_gets_inverse_A_15(MatScalar *a,PetscInt *ipvt,MatScalar *work,PetscReal shift,PetscBool allowzeropivot,PetscBool *zeropivotdetected)
29929a97285SShri Abhyankar {
300766f9fbaSBarry Smith   PetscInt  i__2,i__3,kp1,j,k,l,ll,i,kb,k3;
30129a97285SShri Abhyankar   PetscInt  k4,j3;
302766f9fbaSBarry Smith   MatScalar *aa,*ax,*ay,stmp;
30329a97285SShri Abhyankar   MatReal   tmp,max;
30429a97285SShri Abhyankar 
30529a97285SShri Abhyankar   /* gaussian elimination with partial pivoting */
30629a97285SShri Abhyankar 
30729a97285SShri Abhyankar   PetscFunctionBegin;
308c80103daSHong Zhang   if (zeropivotdetected) *zeropivotdetected = PETSC_FALSE;
309c80103daSHong Zhang 
31029a97285SShri Abhyankar   /* Parameter adjustments */
31129a97285SShri Abhyankar   a -= 16;
31229a97285SShri Abhyankar 
31329a97285SShri Abhyankar   for (k = 1; k <= 14; ++k) {
31429a97285SShri Abhyankar     kp1 = k + 1;
31529a97285SShri Abhyankar     k3  = 15*k;
31629a97285SShri Abhyankar     k4  = k3 + k;
31729a97285SShri Abhyankar     /* find l = pivot index */
31829a97285SShri Abhyankar 
31929a97285SShri Abhyankar     i__2 = 16 - k;
32029a97285SShri Abhyankar     aa   = &a[k4];
32129a97285SShri Abhyankar     max  = PetscAbsScalar(aa[0]);
32229a97285SShri Abhyankar     l    = 1;
32329a97285SShri Abhyankar     for (ll=1; ll<i__2; ll++) {
32429a97285SShri Abhyankar       tmp = PetscAbsScalar(aa[ll]);
32529a97285SShri Abhyankar       if (tmp > max) { max = tmp; l = ll+1;}
32629a97285SShri Abhyankar     }
32729a97285SShri Abhyankar     l        += k - 1;
32829a97285SShri Abhyankar     ipvt[k-1] = l;
32929a97285SShri Abhyankar 
33065e19b50SBarry Smith     if (a[l + k3] == 0.0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %D",k-1);
33129a97285SShri Abhyankar 
33229a97285SShri Abhyankar     /* interchange if necessary */
33329a97285SShri Abhyankar 
33429a97285SShri Abhyankar     if (l != k) {
33529a97285SShri Abhyankar       stmp      = a[l + k3];
33629a97285SShri Abhyankar       a[l + k3] = a[k4];
33729a97285SShri Abhyankar       a[k4]     = stmp;
33829a97285SShri Abhyankar     }
33929a97285SShri Abhyankar 
34029a97285SShri Abhyankar     /* compute multipliers */
34129a97285SShri Abhyankar 
34229a97285SShri Abhyankar     stmp = -1. / a[k4];
34329a97285SShri Abhyankar     i__2 = 15 - k;
34429a97285SShri Abhyankar     aa = &a[1 + k4];
34526fbe8dcSKarl Rupp     for (ll=0; ll<i__2; ll++) aa[ll] *= stmp;
34629a97285SShri Abhyankar 
34729a97285SShri Abhyankar     /* row elimination with column indexing */
34829a97285SShri Abhyankar 
34929a97285SShri Abhyankar     ax = &a[k4+1];
35029a97285SShri Abhyankar     for (j = kp1; j <= 15; ++j) {
35129a97285SShri Abhyankar       j3   = 15*j;
35229a97285SShri Abhyankar       stmp = a[l + j3];
35329a97285SShri Abhyankar       if (l != k) {
35429a97285SShri Abhyankar         a[l + j3] = a[k + j3];
35529a97285SShri Abhyankar         a[k + j3] = stmp;
35629a97285SShri Abhyankar       }
35729a97285SShri Abhyankar 
35829a97285SShri Abhyankar       i__3 = 15 - k;
35929a97285SShri Abhyankar       ay = &a[1+k+j3];
36026fbe8dcSKarl Rupp       for (ll=0; ll<i__3; ll++) ay[ll] += stmp*ax[ll];
36129a97285SShri Abhyankar     }
36229a97285SShri Abhyankar   }
36329a97285SShri Abhyankar   ipvt[14] = 15;
364922032d7SHong Zhang   if (a[240] == 0.0) {
365922032d7SHong Zhang     PetscErrorCode ierr;
366922032d7SHong Zhang     if (allowzeropivot) {
367922032d7SHong Zhang       ierr = PetscInfo1(NULL,"Zero pivot, row %D\n",6);CHKERRQ(ierr);
368922032d7SHong Zhang       *zeropivotdetected = PETSC_TRUE;
369922032d7SHong Zhang     } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %D",6);
370922032d7SHong Zhang   }
37129a97285SShri Abhyankar 
37229a97285SShri Abhyankar   /*
37329a97285SShri Abhyankar    Now form the inverse
37429a97285SShri Abhyankar   */
37529a97285SShri Abhyankar 
37629a97285SShri Abhyankar   /* compute inverse(u) */
37729a97285SShri Abhyankar 
37829a97285SShri Abhyankar   for (k = 1; k <= 15; ++k) {
37929a97285SShri Abhyankar     k3    = 15*k;
38029a97285SShri Abhyankar     k4    = k3 + k;
38129a97285SShri Abhyankar     a[k4] = 1.0 / a[k4];
38229a97285SShri Abhyankar     stmp  = -a[k4];
38329a97285SShri Abhyankar     i__2  = k - 1;
38429a97285SShri Abhyankar     aa    = &a[k3 + 1];
38529a97285SShri Abhyankar     for (ll=0; ll<i__2; ll++) aa[ll] *= stmp;
38629a97285SShri Abhyankar     kp1 = k + 1;
38729a97285SShri Abhyankar     if (15 < kp1) continue;
38829a97285SShri Abhyankar     ax = aa;
38929a97285SShri Abhyankar     for (j = kp1; j <= 15; ++j) {
39029a97285SShri Abhyankar       j3        = 15*j;
39129a97285SShri Abhyankar       stmp      = a[k + j3];
39229a97285SShri Abhyankar       a[k + j3] = 0.0;
39329a97285SShri Abhyankar       ay        = &a[j3 + 1];
39426fbe8dcSKarl Rupp       for (ll=0; ll<k; ll++) ay[ll] += stmp*ax[ll];
39529a97285SShri Abhyankar     }
39629a97285SShri Abhyankar   }
39729a97285SShri Abhyankar 
39829a97285SShri Abhyankar   /* form inverse(u)*inverse(l) */
39929a97285SShri Abhyankar 
40029a97285SShri Abhyankar   for (kb = 1; kb <= 14; ++kb) {
40129a97285SShri Abhyankar     k   = 15 - kb;
40229a97285SShri Abhyankar     k3  = 15*k;
40329a97285SShri Abhyankar     kp1 = k + 1;
40429a97285SShri Abhyankar     aa  = a + k3;
40529a97285SShri Abhyankar     for (i = kp1; i <= 15; ++i) {
40629a97285SShri Abhyankar       work[i-1] = aa[i];
40729a97285SShri Abhyankar       aa[i]     = 0.0;
40829a97285SShri Abhyankar     }
40929a97285SShri Abhyankar     for (j = kp1; j <= 15; ++j) {
41029a97285SShri Abhyankar       stmp    = work[j-1];
41129a97285SShri Abhyankar       ax      = &a[15*j + 1];
41229a97285SShri Abhyankar       ay      = &a[k3 + 1];
41329a97285SShri Abhyankar       ay[0]  += stmp*ax[0];
41429a97285SShri Abhyankar       ay[1]  += stmp*ax[1];
41529a97285SShri Abhyankar       ay[2]  += stmp*ax[2];
41629a97285SShri Abhyankar       ay[3]  += stmp*ax[3];
41729a97285SShri Abhyankar       ay[4]  += stmp*ax[4];
41829a97285SShri Abhyankar       ay[5]  += stmp*ax[5];
41929a97285SShri Abhyankar       ay[6]  += stmp*ax[6];
42029a97285SShri Abhyankar       ay[7]  += stmp*ax[7];
42129a97285SShri Abhyankar       ay[8]  += stmp*ax[8];
42229a97285SShri Abhyankar       ay[9]  += stmp*ax[9];
42329a97285SShri Abhyankar       ay[10] += stmp*ax[10];
42429a97285SShri Abhyankar       ay[11] += stmp*ax[11];
42529a97285SShri Abhyankar       ay[12] += stmp*ax[12];
42629a97285SShri Abhyankar       ay[13] += stmp*ax[13];
42729a97285SShri Abhyankar       ay[14] += stmp*ax[14];
42829a97285SShri Abhyankar     }
42929a97285SShri Abhyankar     l = ipvt[k-1];
43029a97285SShri Abhyankar     if (l != k) {
43129a97285SShri Abhyankar       ax   = &a[k3 + 1];
43229a97285SShri Abhyankar       ay   = &a[15*l + 1];
43329a97285SShri Abhyankar       stmp = ax[0];  ax[0]  = ay[0];  ay[0]  = stmp;
43429a97285SShri Abhyankar       stmp = ax[1];  ax[1]  = ay[1];  ay[1]  = stmp;
43529a97285SShri Abhyankar       stmp = ax[2];  ax[2]  = ay[2];  ay[2]  = stmp;
43629a97285SShri Abhyankar       stmp = ax[3];  ax[3]  = ay[3];  ay[3]  = stmp;
43729a97285SShri Abhyankar       stmp = ax[4];  ax[4]  = ay[4];  ay[4]  = stmp;
43829a97285SShri Abhyankar       stmp = ax[5];  ax[5]  = ay[5];  ay[5]  = stmp;
43929a97285SShri Abhyankar       stmp = ax[6];  ax[6]  = ay[6];  ay[6]  = stmp;
44029a97285SShri Abhyankar       stmp = ax[7];  ax[7]  = ay[7];  ay[7]  = stmp;
44129a97285SShri Abhyankar       stmp = ax[8];  ax[8]  = ay[8];  ay[8]  = stmp;
44229a97285SShri Abhyankar       stmp = ax[9];  ax[9]  = ay[9];  ay[9]  = stmp;
44329a97285SShri Abhyankar       stmp = ax[10]; ax[10] = ay[10]; ay[10] = stmp;
44429a97285SShri Abhyankar       stmp = ax[11]; ax[11] = ay[11]; ay[11] = stmp;
44529a97285SShri Abhyankar       stmp = ax[12]; ax[12] = ay[12]; ay[12] = stmp;
44629a97285SShri Abhyankar       stmp = ax[13]; ax[13] = ay[13]; ay[13] = stmp;
44729a97285SShri Abhyankar       stmp = ax[14]; ax[14] = ay[14]; ay[14] = stmp;
44829a97285SShri Abhyankar     }
44929a97285SShri Abhyankar   }
45029a97285SShri Abhyankar   PetscFunctionReturn(0);
45129a97285SShri Abhyankar }
452