xref: /petsc/src/mat/impls/aij/mpi/pastix/pastix.c (revision 43801a6986a6427ff2fa0944d903e5c3523217e2)
13bf14a46SMatthew Knepley #define PETSCMAT_DLL
23bf14a46SMatthew Knepley 
33bf14a46SMatthew Knepley /*
43bf14a46SMatthew Knepley     Provides an interface to the PaStiX sparse solver
53bf14a46SMatthew Knepley */
63bf14a46SMatthew Knepley #include "../src/mat/impls/aij/seq/aij.h"
73bf14a46SMatthew Knepley #include "../src/mat/impls/aij/mpi/mpiaij.h"
83bf14a46SMatthew Knepley #include "../src/mat/impls/sbaij/seq/sbaij.h"
93bf14a46SMatthew Knepley #include "../src/mat/impls/sbaij/mpi/mpisbaij.h"
103bf14a46SMatthew Knepley 
11*43801a69SSatish Balay #if defined(PETSC_HAVE_STDLIB_H)
12*43801a69SSatish Balay #include <stdlib.h>
13*43801a69SSatish Balay #endif
14*43801a69SSatish Balay #if defined(PETSC_HAVE_STRING_H)
15*43801a69SSatish Balay #include <string.h>
16*43801a69SSatish Balay #endif
17*43801a69SSatish Balay 
183bf14a46SMatthew Knepley EXTERN_C_BEGIN
193bf14a46SMatthew Knepley #include "mpi.h"
203bf14a46SMatthew Knepley #include "pastix.h"
213bf14a46SMatthew Knepley EXTERN_C_END
223bf14a46SMatthew Knepley 
233bf14a46SMatthew Knepley typedef struct Mat_Pastix_ {
243bf14a46SMatthew Knepley   pastix_data_t *pastix_data;              /* Pastix data storage structure                        */
253bf14a46SMatthew Knepley   MatStructure   matstruc;
263bf14a46SMatthew Knepley   PetscInt       n;                        /* Number of columns in the matrix                      */
273bf14a46SMatthew Knepley   PetscInt       *colptr;                  /* Index of first element of each column in row and val */
283bf14a46SMatthew Knepley   PetscInt       *row;                     /* Row of each element of the matrix                    */
293bf14a46SMatthew Knepley   PetscScalar    *val;                     /* Value of each element of the matrix                  */
303bf14a46SMatthew Knepley   PetscInt       *perm;                    /* Permutation tabular                                  */
313bf14a46SMatthew Knepley   PetscInt       *invp;                    /* Reverse permutation tabular                          */
323bf14a46SMatthew Knepley   PetscScalar    *rhs;                     /* Rhight-hand-side member                              */
333bf14a46SMatthew Knepley   PetscInt       rhsnbr;                   /* Rhight-hand-side number (must be 1)                  */
343bf14a46SMatthew Knepley   PetscInt       iparm[64];                /* Integer parameters                                   */
353bf14a46SMatthew Knepley   double         dparm[64];                /* Floating point parameters                            */
363bf14a46SMatthew Knepley   MPI_Comm       pastix_comm;              /* PaStiX MPI communicator                              */
373bf14a46SMatthew Knepley   PetscMPIInt    commRank;                 /* MPI rank                                             */
383bf14a46SMatthew Knepley   PetscMPIInt    commSize;                 /* MPI communicator size                                */
393bf14a46SMatthew Knepley   PetscTruth     CleanUpPastix;            /* Boolean indicating if we call PaStiX clean step      */
403bf14a46SMatthew Knepley   VecScatter     scat_rhs;
413bf14a46SMatthew Knepley   VecScatter     scat_sol;
423bf14a46SMatthew Knepley   Vec            b_seq,x_seq;
433bf14a46SMatthew Knepley   PetscTruth     isAIJ;
443bf14a46SMatthew Knepley   PetscInt       nSolve;                   /* Number of consecutive solve                          */
453bf14a46SMatthew Knepley   PetscErrorCode (*MatDestroy)(Mat);
463bf14a46SMatthew Knepley } Mat_Pastix;
473bf14a46SMatthew Knepley 
483bf14a46SMatthew Knepley EXTERN PetscErrorCode MatDuplicate_Pastix(Mat,MatDuplicateOption,Mat*);
493bf14a46SMatthew Knepley 
503bf14a46SMatthew Knepley /*
513bf14a46SMatthew Knepley    convert Petsc seqaij matrix to CSC: colptr[n], row[nz], val[nz]
523bf14a46SMatthew Knepley 
533bf14a46SMatthew Knepley   input:
543bf14a46SMatthew Knepley     A       - matrix in seqaij or mpisbaij (bs=1) format
553bf14a46SMatthew Knepley     valOnly - FALSE: spaces are allocated and values are set for the CSC
563bf14a46SMatthew Knepley               TRUE:  Only fill values
573bf14a46SMatthew Knepley   output:
583bf14a46SMatthew Knepley     n       - Size of the matrix
593bf14a46SMatthew Knepley     colptr  - Index of first element of each column in row and val
603bf14a46SMatthew Knepley     row     - Row of each element of the matrix
613bf14a46SMatthew Knepley     values  - Value of each element of the matrix
623bf14a46SMatthew Knepley  */
6341c8de11SBarry Smith PetscErrorCode MatConvertToCSC(Mat A,PetscTruth valOnly,PetscInt *n,PetscInt **colptr,PetscInt **row,PetscScalar **values)
6441c8de11SBarry Smith {
653bf14a46SMatthew Knepley   Mat_SeqAIJ     *aa      = (Mat_SeqAIJ*)A->data;
663bf14a46SMatthew Knepley   PetscInt       *rowptr  = aa->i;
673bf14a46SMatthew Knepley   PetscInt       *col     = aa->j;
683bf14a46SMatthew Knepley   PetscScalar    *rvalues = aa->a;
693bf14a46SMatthew Knepley   PetscInt        m       = A->rmap->N;
70745c78f7SBarry Smith   PetscInt        nnz;
713bf14a46SMatthew Knepley   PetscInt        i,j, k;
723bf14a46SMatthew Knepley   PetscInt        base = 1;
733bf14a46SMatthew Knepley   PetscInt        idx;
743bf14a46SMatthew Knepley   PetscErrorCode  ierr;
753bf14a46SMatthew Knepley   PetscInt        colidx;
763bf14a46SMatthew Knepley   PetscInt       *colcount;
7741c8de11SBarry Smith   PetscTruth      isSBAIJ;
7841c8de11SBarry Smith   PetscTruth      isSeqSBAIJ;
7941c8de11SBarry Smith   PetscTruth      isMpiSBAIJ;
80745c78f7SBarry Smith   PetscTruth      isSym;
813bf14a46SMatthew Knepley 
823bf14a46SMatthew Knepley 
833bf14a46SMatthew Knepley   PetscFunctionBegin;
843bf14a46SMatthew Knepley   /* Allocate the CSC */
853bf14a46SMatthew Knepley 
8641c8de11SBarry Smith   ierr = MatIsSymmetric(A,0.0,&isSym);CHKERRQ(ierr);
8741c8de11SBarry Smith   ierr = PetscTypeCompare((PetscObject)A,MATSBAIJ,&isSBAIJ);CHKERRQ(ierr);
8841c8de11SBarry Smith   ierr = PetscTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr);
8941c8de11SBarry Smith   ierr = PetscTypeCompare((PetscObject)A,MATMPISBAIJ,&isMpiSBAIJ);CHKERRQ(ierr);
903bf14a46SMatthew Knepley 
91745c78f7SBarry Smith   *n = A->cmap->N;
92745c78f7SBarry Smith 
93745c78f7SBarry Smith   /* PaStiX only needs triangular matrix if matrix is symmetric
94745c78f7SBarry Smith    */
9541c8de11SBarry Smith   if (isSym && !(isSBAIJ || isSeqSBAIJ || isMpiSBAIJ)) {
96745c78f7SBarry Smith     nnz = (aa->nz - *n)/2 + *n;
97745c78f7SBarry Smith   }
9841c8de11SBarry Smith   else {
99745c78f7SBarry Smith     nnz     = aa->nz;
1003bf14a46SMatthew Knepley   }
1013bf14a46SMatthew Knepley 
1023bf14a46SMatthew Knepley   if (!valOnly){
1033bf14a46SMatthew Knepley     ierr = PetscMalloc(((*n)+1) *sizeof(PetscInt)   ,colptr );CHKERRQ(ierr);
1043bf14a46SMatthew Knepley     ierr = PetscMalloc( nnz     *sizeof(PetscInt)   ,row);CHKERRQ(ierr);
1053bf14a46SMatthew Knepley     ierr = PetscMalloc( nnz     *sizeof(PetscScalar),values);CHKERRQ(ierr);
1063bf14a46SMatthew Knepley 
10741c8de11SBarry Smith     if (isSBAIJ || isSeqSBAIJ || isMpiSBAIJ) {
10841c8de11SBarry Smith 	ierr = PetscMemcpy (*colptr, rowptr, ((*n)+1)*sizeof(PetscInt));CHKERRQ(ierr);
10941c8de11SBarry Smith 	for (i = 0; i < *n+1; i++)
11041c8de11SBarry Smith 	  (*colptr)[i] += base;
11141c8de11SBarry Smith 	ierr = PetscMemcpy (*row, col, (nnz)*sizeof(PetscInt));CHKERRQ(ierr);
11241c8de11SBarry Smith 	for (i = 0; i < nnz; i++)
11341c8de11SBarry Smith 	  (*row)[i] += base;
11441c8de11SBarry Smith 	ierr = PetscMemcpy (*values, rvalues, (nnz)*sizeof(PetscScalar));CHKERRQ(ierr);
11541c8de11SBarry Smith     } else {
11641c8de11SBarry Smith       ierr = PetscMalloc((*n)*sizeof(PetscInt)   ,&colcount);CHKERRQ(ierr);
11741c8de11SBarry Smith 
1183bf14a46SMatthew Knepley       for (i = 0; i < m; i++)
1193bf14a46SMatthew Knepley 	colcount[i] = 0;
1203bf14a46SMatthew Knepley       /* Fill-in colptr */
1213bf14a46SMatthew Knepley       for (i = 0; i < m; i++)
1223bf14a46SMatthew Knepley 	for (j = rowptr[i]; j < rowptr[i+1]; j++)
123745c78f7SBarry Smith 	  if (!isSym || col[j] <= i)
1243bf14a46SMatthew Knepley 	    colcount[col[j]]++;
125745c78f7SBarry Smith 
1263bf14a46SMatthew Knepley       (*colptr)[0] = base;
1273bf14a46SMatthew Knepley       for (j = 0; j < *n; j++) {
1283bf14a46SMatthew Knepley 	(*colptr)[j+1] = (*colptr)[j] + colcount[j];
129745c78f7SBarry Smith 	/* in next loop we fill starting from (*colptr)[colidx] - base */
1303bf14a46SMatthew Knepley 	colcount[j] = -base;
1313bf14a46SMatthew Knepley       }
1323bf14a46SMatthew Knepley 
1333bf14a46SMatthew Knepley       /* Fill-in rows and values */
1343bf14a46SMatthew Knepley       for (i = 0; i < m; i++) {
1353bf14a46SMatthew Knepley 	for (j = rowptr[i]; j < rowptr[i+1]; j++) {
13641c8de11SBarry Smith 	  if (!isSym || col[j] <= i) {
1373bf14a46SMatthew Knepley 	    colidx = col[j];
1383bf14a46SMatthew Knepley 	    idx    = (*colptr)[colidx] + colcount[colidx];
1393bf14a46SMatthew Knepley 	    (*row)[idx]    = i + base;
1403bf14a46SMatthew Knepley 	    (*values)[idx] = rvalues[j];
1413bf14a46SMatthew Knepley 	    colcount[colidx]++;
1423bf14a46SMatthew Knepley 	  }
1433bf14a46SMatthew Knepley 	}
1443bf14a46SMatthew Knepley       }
14541c8de11SBarry Smith       ierr = PetscFree(colcount);CHKERRQ(ierr);
146745c78f7SBarry Smith     }
14741c8de11SBarry Smith   } else {
148745c78f7SBarry Smith     /* Fill-in only values */
1493bf14a46SMatthew Knepley     for (i = 0; i < m; i++) {
1503bf14a46SMatthew Knepley       for (j = rowptr[i]; j < rowptr[i+1]; j++) {
1513bf14a46SMatthew Knepley 	colidx = col[j];
15241c8de11SBarry Smith 	if ((isSBAIJ || isSeqSBAIJ || isMpiSBAIJ) ||!isSym || col[j] <= i)
153745c78f7SBarry Smith 	  {
154745c78f7SBarry Smith 	    /* look for the value to fill */
155745c78f7SBarry Smith 	    for (k = (*colptr)[colidx] - base;
156745c78f7SBarry Smith 		 k < (*colptr)[colidx + 1] - base;
157745c78f7SBarry Smith 		 k++) {
1583bf14a46SMatthew Knepley 	      if ((*row)[k] == i) {
1593bf14a46SMatthew Knepley 		(*values)[k] = rvalues[j];
1603bf14a46SMatthew Knepley 		break;
1613bf14a46SMatthew Knepley 	      }
1623bf14a46SMatthew Knepley 	    }
163745c78f7SBarry Smith 	    /* shouldn't happen, overflow */
1643bf14a46SMatthew Knepley 	    if (k == (*colptr)[colidx + 1] - base)
1653bf14a46SMatthew Knepley 	      PetscFunctionReturn(1);
1663bf14a46SMatthew Knepley 	  }
1673bf14a46SMatthew Knepley       }
1683bf14a46SMatthew Knepley     }
169745c78f7SBarry Smith   }
170*43801a69SSatish Balay   {
171*43801a69SSatish Balay 
172*43801a69SSatish Balay     pastix_int_t    * tmpcolptr = malloc((*n+1)*sizeof(PetscInt));
173*43801a69SSatish Balay     pastix_int_t    * tmprows   = malloc(nnz*sizeof(PetscInt));
174*43801a69SSatish Balay     pastix_float_t  * tmpvalues = malloc(nnz*sizeof(PetscScalar));
175*43801a69SSatish Balay     if (sizeof(PetscScalar) != sizeof(pastix_float_t))
176*43801a69SSatish Balay       {
177*43801a69SSatish Balay 	SETERRQ2(PETSC_ERR_SUP,"sizeof(PetscScalar) %d != sizeof(pastix_float_t) %d", sizeof(PetscScalar), sizeof(pastix_float_t));
178*43801a69SSatish Balay       }
179*43801a69SSatish Balay 
180*43801a69SSatish Balay     memcpy(tmpcolptr, *colptr, (*n+1)*sizeof(PetscInt));
181*43801a69SSatish Balay     memcpy(tmprows,   *row,    nnz*sizeof(PetscInt));
182*43801a69SSatish Balay     memcpy(tmpvalues, *values, nnz*sizeof(PetscScalar));
183*43801a69SSatish Balay     ierr = PetscFree(*row);CHKERRQ(ierr);
184*43801a69SSatish Balay     ierr = PetscFree(*values);CHKERRQ(ierr);
185*43801a69SSatish Balay 
186*43801a69SSatish Balay     pastix_checkMatrix(MPI_COMM_WORLD, API_VERBOSE_NO,
187*43801a69SSatish Balay 		       ((isSym != 0) ? API_SYM_YES : API_SYM_NO),  API_YES,
188*43801a69SSatish Balay 		       *n, &tmpcolptr, &tmprows, &tmpvalues, NULL, 1);
189*43801a69SSatish Balay 
190*43801a69SSatish Balay     memcpy(*colptr, tmpcolptr, (*n+1)*sizeof(PetscInt));
191*43801a69SSatish Balay     free(tmpcolptr);
192*43801a69SSatish Balay     ierr = PetscMalloc( ((*colptr)[*n]-1)  *sizeof(PetscInt)   ,row);CHKERRQ(ierr);
193*43801a69SSatish Balay     memcpy(*row,    tmprows, ((*colptr)[*n]-1)*sizeof(PetscInt));
194*43801a69SSatish Balay     free(tmprows);
195*43801a69SSatish Balay     ierr = PetscMalloc( ((*colptr)[*n]-1)  *sizeof(PetscScalar),values);CHKERRQ(ierr);
196*43801a69SSatish Balay     memcpy(*values, tmpvalues, ((*colptr)[*n]-1)*sizeof(PetscScalar));
197*43801a69SSatish Balay     free(tmpvalues);
198*43801a69SSatish Balay   }
1993bf14a46SMatthew Knepley   PetscFunctionReturn(0);
2003bf14a46SMatthew Knepley }
2013bf14a46SMatthew Knepley 
2023bf14a46SMatthew Knepley 
2033bf14a46SMatthew Knepley 
2043bf14a46SMatthew Knepley #undef __FUNCT__
2053bf14a46SMatthew Knepley #define __FUNCT__ "MatDestroy_Pastix"
2063bf14a46SMatthew Knepley /*
2073bf14a46SMatthew Knepley   Call clean step of PaStiX if lu->CleanUpPastix == true.
2083bf14a46SMatthew Knepley   Free the CSC matrix.
2093bf14a46SMatthew Knepley  */
2103bf14a46SMatthew Knepley PetscErrorCode MatDestroy_Pastix(Mat A)
2113bf14a46SMatthew Knepley {
2123bf14a46SMatthew Knepley   Mat_Pastix      *lu=(Mat_Pastix*)A->spptr;
2133bf14a46SMatthew Knepley   PetscErrorCode   ierr;
2143bf14a46SMatthew Knepley   PetscMPIInt      size=lu->commSize;
215745c78f7SBarry Smith 
2163bf14a46SMatthew Knepley   PetscFunctionBegin;
2173bf14a46SMatthew Knepley   if (lu->CleanUpPastix) {
2183bf14a46SMatthew Knepley     /* Terminate instance, deallocate memories */
2193bf14a46SMatthew Knepley     if (size > 1){
2203bf14a46SMatthew Knepley       ierr = VecScatterDestroy(lu->scat_rhs);CHKERRQ(ierr);
2213bf14a46SMatthew Knepley       ierr = VecDestroy(lu->b_seq);CHKERRQ(ierr);
2223bf14a46SMatthew Knepley       if (lu->nSolve && lu->scat_sol){ierr = VecScatterDestroy(lu->scat_sol);CHKERRQ(ierr);}
2233bf14a46SMatthew Knepley       if (lu->nSolve && lu->x_seq){ierr = VecDestroy(lu->x_seq);CHKERRQ(ierr);}
2243bf14a46SMatthew Knepley     }
2253bf14a46SMatthew Knepley 
2263bf14a46SMatthew Knepley     lu->iparm[IPARM_START_TASK]=API_TASK_CLEAN;
2273bf14a46SMatthew Knepley     lu->iparm[IPARM_END_TASK]=API_TASK_CLEAN;
2283bf14a46SMatthew Knepley 
2293bf14a46SMatthew Knepley     pastix((pastix_data_t **)&(lu->pastix_data),
2303bf14a46SMatthew Knepley 	                      lu->pastix_comm,
2313bf14a46SMatthew Knepley 	   (pastix_int_t)     lu->n,
2323bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->colptr,
2333bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->row,
2343bf14a46SMatthew Knepley 	   (pastix_float_t*)  lu->val,
2353bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->perm,
2363bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->invp,
2373bf14a46SMatthew Knepley 	   (pastix_float_t*)  lu->rhs,
2383bf14a46SMatthew Knepley 	   (pastix_int_t)     lu->rhsnbr,
2393bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->iparm,
2403bf14a46SMatthew Knepley 	                      lu->dparm);
2413bf14a46SMatthew Knepley 
2423bf14a46SMatthew Knepley     ierr = PetscFree(lu->colptr);CHKERRQ(ierr);
2433bf14a46SMatthew Knepley     ierr = PetscFree(lu->row);  CHKERRQ(ierr);
2443bf14a46SMatthew Knepley     ierr = PetscFree(lu->val);  CHKERRQ(ierr);
2453bf14a46SMatthew Knepley     ierr = PetscFree(lu->perm); CHKERRQ(ierr);
2463bf14a46SMatthew Knepley     ierr = PetscFree(lu->invp); CHKERRQ(ierr);
2473bf14a46SMatthew Knepley /*     ierr = PetscFree(lu->rhs);  CHKERRQ(ierr); */
2483bf14a46SMatthew Knepley     ierr = MPI_Comm_free(&(lu->pastix_comm));CHKERRQ(ierr);
2493bf14a46SMatthew Knepley   }
2503bf14a46SMatthew Knepley   ierr = (lu->MatDestroy)(A);CHKERRQ(ierr);
2513bf14a46SMatthew Knepley   PetscFunctionReturn(0);
2523bf14a46SMatthew Knepley }
2533bf14a46SMatthew Knepley 
2543bf14a46SMatthew Knepley #undef __FUNCT__
2553bf14a46SMatthew Knepley #define __FUNCT__ "MatSolve_PaStiX"
2563bf14a46SMatthew Knepley /*
2573bf14a46SMatthew Knepley   Gather right-hand-side.
2583bf14a46SMatthew Knepley   Call for Solve step.
2593bf14a46SMatthew Knepley   Scatter solution.
2603bf14a46SMatthew Knepley  */
2613bf14a46SMatthew Knepley PetscErrorCode MatSolve_PaStiX(Mat A,Vec b,Vec x)
2623bf14a46SMatthew Knepley {
2633bf14a46SMatthew Knepley   Mat_Pastix     *lu=(Mat_Pastix*)A->spptr;
2643bf14a46SMatthew Knepley   PetscScalar    *array;
2653bf14a46SMatthew Knepley   Vec             x_seq;
2663bf14a46SMatthew Knepley   PetscErrorCode  ierr;
2673bf14a46SMatthew Knepley 
2683bf14a46SMatthew Knepley   PetscFunctionBegin;
2693bf14a46SMatthew Knepley   lu->rhsnbr = 1;
2703bf14a46SMatthew Knepley   x_seq = lu->b_seq;
2713bf14a46SMatthew Knepley   if (lu->commSize > 1){
2723bf14a46SMatthew Knepley     /* PaStiX only supports centralized rhs. Scatter b into a seqential rhs vector */
2733bf14a46SMatthew Knepley     ierr = VecScatterBegin(lu->scat_rhs,b,x_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2743bf14a46SMatthew Knepley     ierr = VecScatterEnd(lu->scat_rhs,b,x_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
275b5e56a35SBarry Smith     ierr = VecGetArray(x_seq,&array);CHKERRQ(ierr);
27641c8de11SBarry Smith   } else {  /* size == 1 */
2773bf14a46SMatthew Knepley     ierr = VecCopy(b,x);CHKERRQ(ierr);
2783bf14a46SMatthew Knepley     ierr = VecGetArray(x,&array);CHKERRQ(ierr);
2793bf14a46SMatthew Knepley   }
2803bf14a46SMatthew Knepley   lu->rhs = array;
2813bf14a46SMatthew Knepley   if (lu->commSize == 1){
2823bf14a46SMatthew Knepley     ierr = VecRestoreArray(x,&array);CHKERRQ(ierr);
2833bf14a46SMatthew Knepley   } else {
2843bf14a46SMatthew Knepley     ierr = VecRestoreArray(x_seq,&array);CHKERRQ(ierr);
2853bf14a46SMatthew Knepley   }
2863bf14a46SMatthew Knepley 
2873bf14a46SMatthew Knepley   /* solve phase */
2883bf14a46SMatthew Knepley   /*-------------*/
2893bf14a46SMatthew Knepley   lu->iparm[IPARM_START_TASK] = API_TASK_SOLVE;
2903bf14a46SMatthew Knepley   lu->iparm[IPARM_END_TASK]   = API_TASK_REFINE;
291745c78f7SBarry Smith   lu->iparm[IPARM_RHS_MAKING] = API_RHS_B;
2923bf14a46SMatthew Knepley 
2933bf14a46SMatthew Knepley   pastix((pastix_data_t **)&(lu->pastix_data),
2943bf14a46SMatthew Knepley 	 (MPI_Comm)         lu->pastix_comm,
2953bf14a46SMatthew Knepley 	 (pastix_int_t)     lu->n,
2963bf14a46SMatthew Knepley 	 (pastix_int_t*)    lu->colptr,
2973bf14a46SMatthew Knepley 	 (pastix_int_t*)    lu->row,
2983bf14a46SMatthew Knepley 	 (pastix_float_t*)  lu->val,
2993bf14a46SMatthew Knepley 	 (pastix_int_t*)    lu->perm,
3003bf14a46SMatthew Knepley 	 (pastix_int_t*)    lu->invp,
3013bf14a46SMatthew Knepley 	 (pastix_float_t*)  lu->rhs,
3023bf14a46SMatthew Knepley 	 (pastix_int_t)     lu->rhsnbr,
3033bf14a46SMatthew Knepley 	 (pastix_int_t*)    lu->iparm,
3043bf14a46SMatthew Knepley 	 (double*)          lu->dparm);
3053bf14a46SMatthew Knepley 
3063bf14a46SMatthew Knepley   if (lu->iparm[IPARM_ERROR_NUMBER] < 0) {
307b5e56a35SBarry Smith     SETERRQ1(PETSC_ERR_LIB,"Error reported by PaStiX in solve phase: lu->iparm[IPARM_ERROR_NUMBER] = %d\n",lu->iparm[IPARM_ERROR_NUMBER] );
3083bf14a46SMatthew Knepley   }
3093bf14a46SMatthew Knepley 
3103bf14a46SMatthew Knepley   if (lu->commSize == 1){
3113bf14a46SMatthew Knepley     ierr = VecRestoreArray(x,&(lu->rhs));CHKERRQ(ierr);
3123bf14a46SMatthew Knepley   } else {
3133bf14a46SMatthew Knepley     ierr = VecRestoreArray(x_seq,&(lu->rhs));CHKERRQ(ierr);
3143bf14a46SMatthew Knepley   }
3153bf14a46SMatthew Knepley 
3163bf14a46SMatthew Knepley   if (lu->commSize > 1) { /* convert PaStiX centralized solution to petsc mpi x */
3173bf14a46SMatthew Knepley     ierr = VecScatterBegin(lu->scat_sol,x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3183bf14a46SMatthew Knepley     ierr = VecScatterEnd(lu->scat_sol,x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3193bf14a46SMatthew Knepley   }
3203bf14a46SMatthew Knepley   lu->nSolve++;
3213bf14a46SMatthew Knepley   PetscFunctionReturn(0);
3223bf14a46SMatthew Knepley }
3233bf14a46SMatthew Knepley 
3243bf14a46SMatthew Knepley #if !defined(PETSC_USE_COMPLEX)
3253bf14a46SMatthew Knepley   /*
3263bf14a46SMatthew Knepley      TODO: Fill this function
3273bf14a46SMatthew Knepley      I didn't fill this function
3283bf14a46SMatthew Knepley      because I didn't understood its goal.
3293bf14a46SMatthew Knepley   */
3303bf14a46SMatthew Knepley 
3313bf14a46SMatthew Knepley /*
3323bf14a46SMatthew Knepley   input:
3333bf14a46SMatthew Knepley    F:        numeric factor
3343bf14a46SMatthew Knepley   output:
3353bf14a46SMatthew Knepley    nneg:     total number of pivots
3363bf14a46SMatthew Knepley    nzero:    0
3373bf14a46SMatthew Knepley    npos:     (global dimension of F) - nneg
3383bf14a46SMatthew Knepley */
3393bf14a46SMatthew Knepley 
3403bf14a46SMatthew Knepley #undef __FUNCT__
3413bf14a46SMatthew Knepley #define __FUNCT__ "MatGetInertia_SBAIJPASTIX"
3423bf14a46SMatthew Knepley PetscErrorCode MatGetInertia_SBAIJPASTIX(Mat F,int *nneg,int *nzero,int *npos)
3433bf14a46SMatthew Knepley {
3443bf14a46SMatthew Knepley   PetscFunctionBegin;
3453bf14a46SMatthew Knepley /*   ierr = MPI_Comm_size(((PetscObject)F)->comm,&size);CHKERRQ(ierr); */
3463bf14a46SMatthew Knepley /*   /\* PASTIX 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK *\/ */
3473bf14a46SMatthew Knepley /*   if (size > 1 && lu->id.ICNTL(13) != 1){ */
3483bf14a46SMatthew Knepley /*     SETERRQ1(PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_pastix_icntl_13 must be set as 1 for correct global matrix inertia\n",lu->id.INFOG(13)); */
3493bf14a46SMatthew Knepley /*   } */
3503bf14a46SMatthew Knepley /*   if (nneg){ */
3513bf14a46SMatthew Knepley /*     if (!lu->commSize){ */
3523bf14a46SMatthew Knepley /*       *nneg = lu->id.INFOG(12); */
3533bf14a46SMatthew Knepley /*     } */
3543bf14a46SMatthew Knepley /*     ierr = MPI_Bcast(nneg,1,MPI_INT,0,lu->comm_pastix);CHKERRQ(ierr); */
3553bf14a46SMatthew Knepley /*   } */
3563bf14a46SMatthew Knepley /*   if (nzero) *nzero = lu->iparm[IPARM_NNZEROS]; */
3573bf14a46SMatthew Knepley /*   if (npos)  *npos  = F->rmap->N - (*nneg); */
3583bf14a46SMatthew Knepley   PetscFunctionReturn(0);
3593bf14a46SMatthew Knepley }
3603bf14a46SMatthew Knepley #endif /* !defined(PETSC_USE_COMPLEX) */
3613bf14a46SMatthew Knepley 
3623bf14a46SMatthew Knepley /*
3633bf14a46SMatthew Knepley   Numeric factorisation using PaStiX solver.
3643bf14a46SMatthew Knepley 
3653bf14a46SMatthew Knepley  */
3663bf14a46SMatthew Knepley #undef __FUNCT__
3673bf14a46SMatthew Knepley #define __FUNCT__ "MatFactorNumeric_PASTIX"
3683bf14a46SMatthew Knepley PetscErrorCode MatFactorNumeric_PaStiX(Mat F,Mat A,const MatFactorInfo *info)
3693bf14a46SMatthew Knepley {
3703bf14a46SMatthew Knepley   Mat_Pastix    *lu =(Mat_Pastix*)(F)->spptr;
37141c8de11SBarry Smith   Mat           *tseq;
3723bf14a46SMatthew Knepley   PetscErrorCode ierr = 0;
373b5e56a35SBarry Smith   PetscInt       icntl;
374b5e56a35SBarry Smith   PetscInt       M=A->rmap->N;
3753bf14a46SMatthew Knepley   PetscTruth     valOnly,flg, isSym;
3763bf14a46SMatthew Knepley   Mat            F_diag;
3773bf14a46SMatthew Knepley   IS             is_iden;
3783bf14a46SMatthew Knepley   Vec            b;
3793bf14a46SMatthew Knepley   IS             isrow;
3803bf14a46SMatthew Knepley   PetscTruth     isSeqAIJ,isSeqSBAIJ;
3813bf14a46SMatthew Knepley 
3823bf14a46SMatthew Knepley   PetscFunctionBegin;
38341c8de11SBarry Smith 
3843bf14a46SMatthew Knepley   ierr = PetscTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr);
3853bf14a46SMatthew Knepley   ierr = PetscTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr);
3863bf14a46SMatthew Knepley   if (lu->matstruc == DIFFERENT_NONZERO_PATTERN){
3873bf14a46SMatthew Knepley     (F)->ops->solve   = MatSolve_PaStiX;
3883bf14a46SMatthew Knepley 
3893bf14a46SMatthew Knepley     /* Initialize a PASTIX instance */
3903bf14a46SMatthew Knepley     ierr = MPI_Comm_dup(((PetscObject)A)->comm,&(lu->pastix_comm));CHKERRQ(ierr);
3913bf14a46SMatthew Knepley     ierr = MPI_Comm_rank(lu->pastix_comm, &lu->commRank);         CHKERRQ(ierr);
3923bf14a46SMatthew Knepley     ierr = MPI_Comm_size(lu->pastix_comm, &lu->commSize);         CHKERRQ(ierr);
3933bf14a46SMatthew Knepley 
3943bf14a46SMatthew Knepley     /* Set pastix options */
3953bf14a46SMatthew Knepley     lu->iparm[IPARM_MODIFY_PARAMETER] = API_NO;
3963bf14a46SMatthew Knepley     lu->iparm[IPARM_START_TASK]       = API_TASK_INIT;
3973bf14a46SMatthew Knepley     lu->iparm[IPARM_END_TASK]         = API_TASK_INIT;
3983bf14a46SMatthew Knepley     lu->rhsnbr = 1;
3993bf14a46SMatthew Knepley 
4003bf14a46SMatthew Knepley     /* Call to set default pastix options */
4013bf14a46SMatthew Knepley     pastix((pastix_data_t **)&(lu->pastix_data),
4023bf14a46SMatthew Knepley 	   (MPI_Comm)         lu->pastix_comm,
4033bf14a46SMatthew Knepley 	   (pastix_int_t)     lu->n,
4043bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->colptr,
4053bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->row,
4063bf14a46SMatthew Knepley 	   (pastix_float_t*)  lu->val,
4073bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->perm,
4083bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->invp,
4093bf14a46SMatthew Knepley 	   (pastix_float_t*)  lu->rhs,
4103bf14a46SMatthew Knepley 	   (pastix_int_t)     lu->rhsnbr,
4113bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->iparm,
4123bf14a46SMatthew Knepley 	   (double*)          lu->dparm);
4133bf14a46SMatthew Knepley 
4143bf14a46SMatthew Knepley     ierr = PetscOptionsBegin(((PetscObject)A)->comm,((PetscObject)A)->prefix,"PaStiX Options","Mat");CHKERRQ(ierr);
4153bf14a46SMatthew Knepley 
4163bf14a46SMatthew Knepley     icntl=-1;
41741c8de11SBarry Smith     lu->iparm[IPARM_VERBOSE] = API_VERBOSE_NOT;
41841c8de11SBarry Smith     ierr = PetscOptionsInt("-mat_pastix_verbose","iparm[IPARM_VERBOSE] : level of printing (0 to 2)","None",lu->iparm[IPARM_VERBOSE],&icntl,&flg);CHKERRQ(ierr);
4193bf14a46SMatthew Knepley     if ((flg && icntl > 0) || PetscLogPrintInfo) {
4203bf14a46SMatthew Knepley       lu->iparm[IPARM_VERBOSE] =  icntl;
4213bf14a46SMatthew Knepley     }
4223bf14a46SMatthew Knepley     icntl=-1;
42341c8de11SBarry Smith     ierr = PetscOptionsInt("-mat_pastix_threadnbr","iparm[IPARM_THREAD_NBR] : Number of thread by MPI node","None",lu->iparm[IPARM_THREAD_NBR],&icntl,PETSC_NULL);CHKERRQ(ierr);
4243bf14a46SMatthew Knepley     if ((flg && icntl > 0)) {
4253bf14a46SMatthew Knepley       lu->iparm[IPARM_THREAD_NBR] = icntl;
4263bf14a46SMatthew Knepley     }
4273bf14a46SMatthew Knepley     PetscOptionsEnd();
4283bf14a46SMatthew Knepley     valOnly = PETSC_FALSE;
42941c8de11SBarry Smith   }  else {
4303bf14a46SMatthew Knepley     valOnly = PETSC_TRUE;
4313bf14a46SMatthew Knepley   }
4323bf14a46SMatthew Knepley 
4333bf14a46SMatthew Knepley   lu->iparm[IPARM_MATRIX_VERIFICATION] = API_YES;
4343bf14a46SMatthew Knepley 
4353bf14a46SMatthew Knepley   /* convert mpi A to seq mat A */
4363bf14a46SMatthew Knepley   ierr = ISCreateStride(PETSC_COMM_SELF,M,0,1,&isrow);CHKERRQ(ierr);
4373bf14a46SMatthew Knepley   ierr = MatGetSubMatrices(A,1,&isrow,&isrow,MAT_INITIAL_MATRIX,&tseq);CHKERRQ(ierr);
4383bf14a46SMatthew Knepley   ierr = ISDestroy(isrow);CHKERRQ(ierr);
4393bf14a46SMatthew Knepley 
44041c8de11SBarry Smith   ierr = MatConvertToCSC(*tseq,valOnly, &lu->n, &lu->colptr, &lu->row, &lu->val);CHKERRQ(ierr);
44141c8de11SBarry Smith   ierr = MatIsSymmetric(*tseq,0.0,&isSym);CHKERRQ(ierr);
44241c8de11SBarry Smith   ierr = MatDestroyMatrices(1,&tseq);CHKERRQ(ierr);
44341c8de11SBarry Smith 
4443bf14a46SMatthew Knepley   ierr = PetscMalloc((lu->n)*sizeof(PetscInt)   ,&(lu->perm));CHKERRQ(ierr);
4453bf14a46SMatthew Knepley   ierr = PetscMalloc((lu->n)*sizeof(PetscInt)   ,&(lu->invp));CHKERRQ(ierr);
4463bf14a46SMatthew Knepley 
4473bf14a46SMatthew Knepley 
4483bf14a46SMatthew Knepley   if (isSym) {
449745c78f7SBarry Smith     /* On symmetric matrix, LLT */
4503bf14a46SMatthew Knepley     lu->iparm[IPARM_SYM] = API_SYM_YES;
45141c8de11SBarry Smith     lu->iparm[IPARM_FACTORIZATION] = API_FACT_LDLT;
4523bf14a46SMatthew Knepley   }
4533bf14a46SMatthew Knepley   else {
454745c78f7SBarry Smith     /* On unsymmetric matrix, LU */
4553bf14a46SMatthew Knepley     lu->iparm[IPARM_SYM] = API_SYM_NO;
4563bf14a46SMatthew Knepley     lu->iparm[IPARM_FACTORIZATION] = API_FACT_LU;
4573bf14a46SMatthew Knepley   }
4583bf14a46SMatthew Knepley 
4593bf14a46SMatthew Knepley   /*----------------*/
4603bf14a46SMatthew Knepley   if (lu->matstruc == DIFFERENT_NONZERO_PATTERN){
4613bf14a46SMatthew Knepley     if (!(isSeqAIJ || isSeqSBAIJ)) {
4623bf14a46SMatthew Knepley       /* PaStiX only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */
4633bf14a46SMatthew Knepley 	ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&lu->b_seq);CHKERRQ(ierr);
4643bf14a46SMatthew Knepley 	ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr);
4653bf14a46SMatthew Knepley 	ierr = VecCreate(((PetscObject)A)->comm,&b);CHKERRQ(ierr);
4663bf14a46SMatthew Knepley 	ierr = VecSetSizes(b,A->rmap->n,PETSC_DECIDE);CHKERRQ(ierr);
4673bf14a46SMatthew Knepley 	ierr = VecSetFromOptions(b);CHKERRQ(ierr);
4683bf14a46SMatthew Knepley 
4693bf14a46SMatthew Knepley 	ierr = VecScatterCreate(b,is_iden,lu->b_seq,is_iden,&lu->scat_rhs);CHKERRQ(ierr);
4703bf14a46SMatthew Knepley 	ierr = VecScatterCreate(lu->b_seq,is_iden,b,is_iden,&lu->scat_sol);CHKERRQ(ierr);
4713bf14a46SMatthew Knepley 	ierr = ISDestroy(is_iden);CHKERRQ(ierr);
4723bf14a46SMatthew Knepley 	ierr = VecDestroy(b);CHKERRQ(ierr);
4733bf14a46SMatthew Knepley     }
4743bf14a46SMatthew Knepley     lu->iparm[IPARM_START_TASK] = API_TASK_ORDERING;
4753bf14a46SMatthew Knepley     lu->iparm[IPARM_END_TASK]   = API_TASK_NUMFACT;
4763bf14a46SMatthew Knepley 
4773bf14a46SMatthew Knepley     pastix((pastix_data_t **)&(lu->pastix_data),
4783bf14a46SMatthew Knepley 	   (MPI_Comm)         lu->pastix_comm,
4793bf14a46SMatthew Knepley 	   (pastix_int_t)     lu->n,
4803bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->colptr,
4813bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->row,
4823bf14a46SMatthew Knepley 	   (pastix_float_t*)  lu->val,
4833bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->perm,
4843bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->invp,
4853bf14a46SMatthew Knepley 	   (pastix_float_t*)  lu->rhs,
4863bf14a46SMatthew Knepley 	   (pastix_int_t)     lu->rhsnbr,
4873bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->iparm,
4883bf14a46SMatthew Knepley 	   (double*)          lu->dparm);
4893bf14a46SMatthew Knepley     if (lu->iparm[IPARM_ERROR_NUMBER] < 0) {
49041c8de11SBarry Smith       SETERRQ1(PETSC_ERR_LIB,"Error reported by PaStiX in analysis phase: iparm(IPARM_ERROR_NUMBER)=%d\n",lu->iparm[IPARM_ERROR_NUMBER]);
4913bf14a46SMatthew Knepley     }
49241c8de11SBarry Smith   } else {
4933bf14a46SMatthew Knepley     lu->iparm[IPARM_START_TASK] = API_TASK_NUMFACT;
4943bf14a46SMatthew Knepley     lu->iparm[IPARM_END_TASK]   = API_TASK_NUMFACT;
4953bf14a46SMatthew Knepley     pastix((pastix_data_t **)&(lu->pastix_data),
4963bf14a46SMatthew Knepley 	   (MPI_Comm)         lu->pastix_comm,
4973bf14a46SMatthew Knepley 	   (pastix_int_t)     lu->n,
4983bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->colptr,
4993bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->row,
5003bf14a46SMatthew Knepley 	   (pastix_float_t*)  lu->val,
5013bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->perm,
5023bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->invp,
5033bf14a46SMatthew Knepley 	   (pastix_float_t*)  lu->rhs,
5043bf14a46SMatthew Knepley 	   (pastix_int_t)     lu->rhsnbr,
5053bf14a46SMatthew Knepley 	   (pastix_int_t*)    lu->iparm,
5063bf14a46SMatthew Knepley 	   (double*)          lu->dparm);
5073bf14a46SMatthew Knepley 
5083bf14a46SMatthew Knepley     if (lu->iparm[IPARM_ERROR_NUMBER] < 0) {
50941c8de11SBarry Smith       SETERRQ1(PETSC_ERR_LIB,"Error reported by PaStiX in analysis phase: iparm(IPARM_ERROR_NUMBER)=%d\n",lu->iparm[IPARM_ERROR_NUMBER]);
5103bf14a46SMatthew Knepley     }
5113bf14a46SMatthew Knepley   }
5123bf14a46SMatthew Knepley 
5133bf14a46SMatthew Knepley   if (lu->commSize > 1){
5143bf14a46SMatthew Knepley     if ((F)->factor == MAT_FACTOR_LU){
5153bf14a46SMatthew Knepley       F_diag = ((Mat_MPIAIJ *)(F)->data)->A;
5163bf14a46SMatthew Knepley     } else {
5173bf14a46SMatthew Knepley       F_diag = ((Mat_MPISBAIJ *)(F)->data)->A;
5183bf14a46SMatthew Knepley     }
5193bf14a46SMatthew Knepley     F_diag->assembled = PETSC_TRUE;
5203bf14a46SMatthew Knepley     if (lu->nSolve){
5213bf14a46SMatthew Knepley       ierr = VecScatterDestroy(lu->scat_sol);CHKERRQ(ierr);
5223bf14a46SMatthew Knepley       ierr = VecDestroy(lu->x_seq);CHKERRQ(ierr);
5233bf14a46SMatthew Knepley     }
5243bf14a46SMatthew Knepley   }
5253bf14a46SMatthew Knepley   (F)->assembled     = PETSC_TRUE;
5263bf14a46SMatthew Knepley   lu->matstruc       = SAME_NONZERO_PATTERN;
5273bf14a46SMatthew Knepley   lu->CleanUpPastix  = PETSC_TRUE;
5283bf14a46SMatthew Knepley   lu->nSolve         = 0;
5293bf14a46SMatthew Knepley   PetscFunctionReturn(0);
5303bf14a46SMatthew Knepley }
5313bf14a46SMatthew Knepley 
5323bf14a46SMatthew Knepley 
5333bf14a46SMatthew Knepley /* Note the Petsc r and c permutations are ignored */
5343bf14a46SMatthew Knepley #undef __FUNCT__
5353bf14a46SMatthew Knepley #define __FUNCT__ "MatLUFactorSymbolic_AIJPASTIX"
5363bf14a46SMatthew Knepley PetscErrorCode MatLUFactorSymbolic_AIJPASTIX(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info)
5373bf14a46SMatthew Knepley {
5383bf14a46SMatthew Knepley   Mat_Pastix      *lu = (Mat_Pastix*)F->spptr;
5393bf14a46SMatthew Knepley 
5403bf14a46SMatthew Knepley   PetscFunctionBegin;
5413bf14a46SMatthew Knepley   lu->iparm[IPARM_FACTORIZATION] = API_FACT_LU;
5423bf14a46SMatthew Knepley   lu->iparm[IPARM_SYM]           = API_SYM_YES;
5433bf14a46SMatthew Knepley   lu->matstruc                   = DIFFERENT_NONZERO_PATTERN;
5443bf14a46SMatthew Knepley   F->ops->lufactornumeric        = MatFactorNumeric_PaStiX;
5453bf14a46SMatthew Knepley   PetscFunctionReturn(0);
5463bf14a46SMatthew Knepley }
5473bf14a46SMatthew Knepley 
5483bf14a46SMatthew Knepley 
5493bf14a46SMatthew Knepley /* Note the Petsc r permutation is ignored */
5503bf14a46SMatthew Knepley #undef __FUNCT__
5513bf14a46SMatthew Knepley #define __FUNCT__ "MatCholeskyFactorSymbolic_SBAIJPASTIX"
5523bf14a46SMatthew Knepley PetscErrorCode MatCholeskyFactorSymbolic_SBAIJPASTIX(Mat F,Mat A,IS r,const MatFactorInfo *info)
5533bf14a46SMatthew Knepley {
5543bf14a46SMatthew Knepley   Mat_Pastix      *lu = (Mat_Pastix*)(F)->spptr;
5553bf14a46SMatthew Knepley 
5563bf14a46SMatthew Knepley   PetscFunctionBegin;
5573bf14a46SMatthew Knepley   lu->iparm[IPARM_FACTORIZATION]  = API_FACT_LLT;
5583bf14a46SMatthew Knepley   lu->iparm[IPARM_SYM]            = API_SYM_NO;
5593bf14a46SMatthew Knepley   lu->matstruc                    = DIFFERENT_NONZERO_PATTERN;
5603bf14a46SMatthew Knepley   (F)->ops->choleskyfactornumeric = MatFactorNumeric_PaStiX;
5613bf14a46SMatthew Knepley #if !defined(PETSC_USE_COMPLEX)
5623bf14a46SMatthew Knepley   (F)->ops->getinertia            = MatGetInertia_SBAIJPASTIX;
5633bf14a46SMatthew Knepley #endif
5643bf14a46SMatthew Knepley   PetscFunctionReturn(0);
5653bf14a46SMatthew Knepley }
5663bf14a46SMatthew Knepley 
5673bf14a46SMatthew Knepley #undef __FUNCT__
5683bf14a46SMatthew Knepley #define __FUNCT__ "MatView_PaStiX"
5693bf14a46SMatthew Knepley PetscErrorCode MatView_PaStiX(Mat A,PetscViewer viewer)
5703bf14a46SMatthew Knepley {
5713bf14a46SMatthew Knepley   PetscErrorCode    ierr;
5723bf14a46SMatthew Knepley   PetscTruth        iascii;
5733bf14a46SMatthew Knepley   PetscViewerFormat format;
5743bf14a46SMatthew Knepley 
5753bf14a46SMatthew Knepley   PetscFunctionBegin;
5763bf14a46SMatthew Knepley   ierr = PetscTypeCompare((PetscObject)viewer,PETSC_VIEWER_ASCII,&iascii);CHKERRQ(ierr);
5773bf14a46SMatthew Knepley   if (iascii) {
5783bf14a46SMatthew Knepley     ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr);
5793bf14a46SMatthew Knepley     if (format == PETSC_VIEWER_ASCII_INFO){
580b5e56a35SBarry Smith       Mat_Pastix      *lu=(Mat_Pastix*)A->spptr;
581b5e56a35SBarry Smith 
582b5e56a35SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"PaStiX run parameters:\n");CHKERRQ(ierr);
583b5e56a35SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"  Matrix type :                      %s \n",((lu->iparm[IPARM_SYM] == API_SYM_YES)?"Symmetric":"Unsymmetric"));CHKERRQ(ierr);
584b5e56a35SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"  Level of printing (0,1,2):         %d \n",lu->iparm[IPARM_VERBOSE]);CHKERRQ(ierr);
585b5e56a35SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"  Number of refinements iterations : %d \n",lu->iparm[IPARM_NBITER]);CHKERRQ(ierr);
586b5e56a35SBarry Smith       ierr = PetscPrintf(PETSC_COMM_SELF,"  Error :                        %g \n",lu->dparm[DPARM_RELATIVE_ERROR]);CHKERRQ(ierr);
5873bf14a46SMatthew Knepley     }
5883bf14a46SMatthew Knepley   }
5893bf14a46SMatthew Knepley   PetscFunctionReturn(0);
5903bf14a46SMatthew Knepley }
5913bf14a46SMatthew Knepley 
5923bf14a46SMatthew Knepley 
5933bf14a46SMatthew Knepley /*MC
594b5e56a35SBarry Smith      MAT_SOLVER_PASTIX  - A solver package providing direct solvers (LU) for distributed
5953bf14a46SMatthew Knepley   and sequential matrices via the external package PaStiX.
5963bf14a46SMatthew Knepley 
597b5e56a35SBarry Smith   Use config/configure.py --download-pastix to have PETSc installed with PaStiX
5983bf14a46SMatthew Knepley 
5993bf14a46SMatthew Knepley   Options Database Keys:
600b5e56a35SBarry Smith + -mat_pastix_verbose   <0,1,2>   - print level
601b5e56a35SBarry Smith - -mat_pastix_threadnbr <integer> - Set the thread number by MPI task.
6023bf14a46SMatthew Knepley 
6033bf14a46SMatthew Knepley   Level: beginner
6043bf14a46SMatthew Knepley 
60541c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage
60641c8de11SBarry Smith 
6073bf14a46SMatthew Knepley M*/
6083bf14a46SMatthew Knepley 
6093bf14a46SMatthew Knepley 
6103bf14a46SMatthew Knepley #undef __FUNCT__
6113bf14a46SMatthew Knepley #define __FUNCT__ "MatGetInfo_PaStiX"
6123bf14a46SMatthew Knepley PetscErrorCode MatGetInfo_PaStiX(Mat A,MatInfoType flag,MatInfo *info)
6133bf14a46SMatthew Knepley {
6143bf14a46SMatthew Knepley     Mat_Pastix  *lu =(Mat_Pastix*)A->spptr;
6153bf14a46SMatthew Knepley 
6163bf14a46SMatthew Knepley     PetscFunctionBegin;
6173bf14a46SMatthew Knepley     info->block_size        = 1.0;
6183bf14a46SMatthew Knepley     info->nz_allocated      = lu->iparm[IPARM_NNZEROS];
6193bf14a46SMatthew Knepley     info->nz_used           = lu->iparm[IPARM_NNZEROS];
6203bf14a46SMatthew Knepley     info->nz_unneeded       = 0.0;
6213bf14a46SMatthew Knepley     info->assemblies        = 0.0;
6223bf14a46SMatthew Knepley     info->mallocs           = 0.0;
6233bf14a46SMatthew Knepley     info->memory            = 0.0;
6243bf14a46SMatthew Knepley     info->fill_ratio_given  = 0;
6253bf14a46SMatthew Knepley     info->fill_ratio_needed = 0;
6263bf14a46SMatthew Knepley     info->factor_mallocs    = 0;
6273bf14a46SMatthew Knepley     PetscFunctionReturn(0);
6283bf14a46SMatthew Knepley }
6293bf14a46SMatthew Knepley 
6303bf14a46SMatthew Knepley EXTERN_C_BEGIN
6313bf14a46SMatthew Knepley #undef __FUNCT__
6323bf14a46SMatthew Knepley #define __FUNCT__ "MatFactorGetSolverPackage_pastix"
6333bf14a46SMatthew Knepley PetscErrorCode MatFactorGetSolverPackage_pastix(Mat A,const MatSolverPackage *type)
6343bf14a46SMatthew Knepley {
6353bf14a46SMatthew Knepley   PetscFunctionBegin;
6363bf14a46SMatthew Knepley   *type = MAT_SOLVER_PASTIX;
6373bf14a46SMatthew Knepley   PetscFunctionReturn(0);
6383bf14a46SMatthew Knepley }
6393bf14a46SMatthew Knepley EXTERN_C_END
6403bf14a46SMatthew Knepley 
6413bf14a46SMatthew Knepley EXTERN_C_BEGIN
6423bf14a46SMatthew Knepley /*
6433bf14a46SMatthew Knepley     The seq and mpi versions of this function are the same
6443bf14a46SMatthew Knepley */
6453bf14a46SMatthew Knepley #undef __FUNCT__
6463bf14a46SMatthew Knepley #define __FUNCT__ "MatGetFactor_seqaij_pastix"
6473bf14a46SMatthew Knepley PetscErrorCode MatGetFactor_seqaij_pastix(Mat A,MatFactorType ftype,Mat *F)
6483bf14a46SMatthew Knepley {
6493bf14a46SMatthew Knepley   Mat            B;
6503bf14a46SMatthew Knepley   PetscErrorCode ierr;
6513bf14a46SMatthew Knepley   Mat_Pastix    *pastix;
6523bf14a46SMatthew Knepley 
6533bf14a46SMatthew Knepley   PetscFunctionBegin;
6543bf14a46SMatthew Knepley   if (ftype != MAT_FACTOR_LU) {
6553bf14a46SMatthew Knepley     SETERRQ(PETSC_ERR_SUP,"Cannot use PETSc AIJ matrices with PaStiX Cholesky, use SBAIJ matrix");
6563bf14a46SMatthew Knepley   }
6573bf14a46SMatthew Knepley   /* Create the factorization matrix */
6583bf14a46SMatthew Knepley   ierr = MatCreate(((PetscObject)A)->comm,&B);CHKERRQ(ierr);
6593bf14a46SMatthew Knepley   ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr);
6603bf14a46SMatthew Knepley   ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr);
6613bf14a46SMatthew Knepley   ierr = MatSeqAIJSetPreallocation(B,0,PETSC_NULL);CHKERRQ(ierr);
6623bf14a46SMatthew Knepley 
6633bf14a46SMatthew Knepley   B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJPASTIX;
6643bf14a46SMatthew Knepley   B->ops->view             = MatView_PaStiX;
6653bf14a46SMatthew Knepley   B->ops->getinfo          = MatGetInfo_PaStiX;
6663bf14a46SMatthew Knepley   ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatFactorGetSolverPackage_C",
6673bf14a46SMatthew Knepley 					   "MatFactorGetSolverPackage_pastix",
6683bf14a46SMatthew Knepley 					   MatFactorGetSolverPackage_pastix);CHKERRQ(ierr);
6693bf14a46SMatthew Knepley   B->factor                = MAT_FACTOR_LU;
6703bf14a46SMatthew Knepley 
6713bf14a46SMatthew Knepley   ierr = PetscNewLog(B,Mat_Pastix,&pastix);CHKERRQ(ierr);
6723bf14a46SMatthew Knepley   pastix->CleanUpPastix             = PETSC_FALSE;
6733bf14a46SMatthew Knepley   pastix->isAIJ                     = PETSC_TRUE;
6743bf14a46SMatthew Knepley   pastix->scat_rhs                  = PETSC_NULL;
6753bf14a46SMatthew Knepley   pastix->scat_sol                  = PETSC_NULL;
6763bf14a46SMatthew Knepley   pastix->nSolve                    = 0;
6773bf14a46SMatthew Knepley   pastix->MatDestroy                = B->ops->destroy;
6783bf14a46SMatthew Knepley   B->ops->destroy                   = MatDestroy_Pastix;
6793bf14a46SMatthew Knepley   B->spptr                          = (void*)pastix;
6803bf14a46SMatthew Knepley 
6813bf14a46SMatthew Knepley   *F = B;
6823bf14a46SMatthew Knepley   PetscFunctionReturn(0);
6833bf14a46SMatthew Knepley }
6843bf14a46SMatthew Knepley EXTERN_C_END
6853bf14a46SMatthew Knepley 
686b5e56a35SBarry Smith 
6873bf14a46SMatthew Knepley EXTERN_C_BEGIN
6883bf14a46SMatthew Knepley #undef __FUNCT__
6893bf14a46SMatthew Knepley #define __FUNCT__ "MatGetFactor_mpiaij_pastix"
6903bf14a46SMatthew Knepley PetscErrorCode MatGetFactor_mpiaij_pastix(Mat A,MatFactorType ftype,Mat *F)
6913bf14a46SMatthew Knepley {
6923bf14a46SMatthew Knepley   Mat            B;
6933bf14a46SMatthew Knepley   PetscErrorCode ierr;
6943bf14a46SMatthew Knepley   Mat_Pastix    *pastix;
6953bf14a46SMatthew Knepley 
6963bf14a46SMatthew Knepley   PetscFunctionBegin;
69741c8de11SBarry Smith   if (ftype != MAT_FACTOR_LU) SETERRQ(PETSC_ERR_SUP,"Cannot use PETSc AIJ matrices with PaStiX Cholesky, use SBAIJ matrix");
6983bf14a46SMatthew Knepley   /* Create the factorization matrix */
6993bf14a46SMatthew Knepley   ierr = MatCreate(((PetscObject)A)->comm,&B);CHKERRQ(ierr);
7003bf14a46SMatthew Knepley   ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr);
7013bf14a46SMatthew Knepley   ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr);
7023bf14a46SMatthew Knepley   ierr = MatSeqAIJSetPreallocation(B,0,PETSC_NULL);CHKERRQ(ierr);
7033bf14a46SMatthew Knepley   ierr = MatMPIAIJSetPreallocation(B,0,PETSC_NULL,0,PETSC_NULL);CHKERRQ(ierr);
7043bf14a46SMatthew Knepley 
7053bf14a46SMatthew Knepley   B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJPASTIX;
7063bf14a46SMatthew Knepley   B->ops->view             = MatView_PaStiX;
7073bf14a46SMatthew Knepley   ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,
7083bf14a46SMatthew Knepley 					   "MatFactorGetSolverPackage_C",
7093bf14a46SMatthew Knepley 					   "MatFactorGetSolverPackage_pastix",
7103bf14a46SMatthew Knepley 					   MatFactorGetSolverPackage_pastix);CHKERRQ(ierr);
7113bf14a46SMatthew Knepley   B->factor                = MAT_FACTOR_LU;
7123bf14a46SMatthew Knepley 
7133bf14a46SMatthew Knepley   ierr = PetscNewLog(B,Mat_Pastix,&pastix);CHKERRQ(ierr);
7143bf14a46SMatthew Knepley   pastix->CleanUpPastix             = PETSC_FALSE;
7153bf14a46SMatthew Knepley   pastix->isAIJ                     = PETSC_TRUE;
7163bf14a46SMatthew Knepley   pastix->scat_rhs                  = PETSC_NULL;
7173bf14a46SMatthew Knepley   pastix->scat_sol                  = PETSC_NULL;
7183bf14a46SMatthew Knepley   pastix->nSolve                    = 0;
7193bf14a46SMatthew Knepley   pastix->MatDestroy                = B->ops->destroy;
7203bf14a46SMatthew Knepley   B->ops->destroy                  = MatDestroy_Pastix;
7213bf14a46SMatthew Knepley   B->spptr                         = (void*)pastix;
7223bf14a46SMatthew Knepley 
7233bf14a46SMatthew Knepley   *F = B;
7243bf14a46SMatthew Knepley   PetscFunctionReturn(0);
7253bf14a46SMatthew Knepley }
7263bf14a46SMatthew Knepley EXTERN_C_END
7273bf14a46SMatthew Knepley 
7283bf14a46SMatthew Knepley EXTERN_C_BEGIN
7293bf14a46SMatthew Knepley #undef __FUNCT__
7303bf14a46SMatthew Knepley #define __FUNCT__ "MatGetFactor_seqsbaij_pastix"
7313bf14a46SMatthew Knepley PetscErrorCode MatGetFactor_seqsbaij_pastix(Mat A,MatFactorType ftype,Mat *F)
7323bf14a46SMatthew Knepley {
7333bf14a46SMatthew Knepley   Mat            B;
7343bf14a46SMatthew Knepley   PetscErrorCode ierr;
7353bf14a46SMatthew Knepley   Mat_Pastix    *pastix;
7363bf14a46SMatthew Knepley 
7373bf14a46SMatthew Knepley   PetscFunctionBegin;
7383bf14a46SMatthew Knepley   if (ftype != MAT_FACTOR_CHOLESKY) {
7393bf14a46SMatthew Knepley     SETERRQ(PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with PaStiX LU, use AIJ matrix");
7403bf14a46SMatthew Knepley   }
7413bf14a46SMatthew Knepley   /* Create the factorization matrix */
7423bf14a46SMatthew Knepley   ierr = MatCreate(((PetscObject)A)->comm,&B);CHKERRQ(ierr);
7433bf14a46SMatthew Knepley   ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr);
7443bf14a46SMatthew Knepley   ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr);
7453bf14a46SMatthew Knepley   ierr = MatSeqSBAIJSetPreallocation(B,1,0,PETSC_NULL);CHKERRQ(ierr);
7463bf14a46SMatthew Knepley   ierr = MatMPISBAIJSetPreallocation(B,1,0,PETSC_NULL,0,PETSC_NULL);CHKERRQ(ierr);
7473bf14a46SMatthew Knepley 
7483bf14a46SMatthew Knepley   B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SBAIJPASTIX;
7493bf14a46SMatthew Knepley   B->ops->view                   = MatView_PaStiX;
7503bf14a46SMatthew Knepley   ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,
7513bf14a46SMatthew Knepley 					   "MatFactorGetSolverPackage_C",
7523bf14a46SMatthew Knepley 					   "MatFactorGetSolverPackage_pastix",
7533bf14a46SMatthew Knepley 					   MatFactorGetSolverPackage_pastix);CHKERRQ(ierr);
7543bf14a46SMatthew Knepley 
7553bf14a46SMatthew Knepley   B->factor                      = MAT_FACTOR_CHOLESKY;
7563bf14a46SMatthew Knepley 
7573bf14a46SMatthew Knepley   ierr = PetscNewLog(B,Mat_Pastix,&pastix);CHKERRQ(ierr);
7583bf14a46SMatthew Knepley   pastix->CleanUpPastix             = PETSC_FALSE;
7593bf14a46SMatthew Knepley   pastix->isAIJ                     = PETSC_TRUE;
7603bf14a46SMatthew Knepley   pastix->scat_rhs                  = PETSC_NULL;
7613bf14a46SMatthew Knepley   pastix->scat_sol                  = PETSC_NULL;
7623bf14a46SMatthew Knepley   pastix->nSolve                    = 0;
7633bf14a46SMatthew Knepley   pastix->MatDestroy                = B->ops->destroy;
7643bf14a46SMatthew Knepley   B->ops->destroy                  = MatDestroy_Pastix;
7653bf14a46SMatthew Knepley   B->spptr                         = (void*)pastix;
7663bf14a46SMatthew Knepley 
7673bf14a46SMatthew Knepley   *F = B;
7683bf14a46SMatthew Knepley   PetscFunctionReturn(0);
7693bf14a46SMatthew Knepley }
7703bf14a46SMatthew Knepley EXTERN_C_END
7713bf14a46SMatthew Knepley 
7723bf14a46SMatthew Knepley EXTERN_C_BEGIN
7733bf14a46SMatthew Knepley #undef __FUNCT__
7743bf14a46SMatthew Knepley #define __FUNCT__ "MatGetFactor_mpisbaij_pastix"
7753bf14a46SMatthew Knepley PetscErrorCode MatGetFactor_mpisbaij_pastix(Mat A,MatFactorType ftype,Mat *F)
7763bf14a46SMatthew Knepley {
7773bf14a46SMatthew Knepley   Mat            B;
7783bf14a46SMatthew Knepley   PetscErrorCode ierr;
7793bf14a46SMatthew Knepley   Mat_Pastix    *pastix;
7803bf14a46SMatthew Knepley 
7813bf14a46SMatthew Knepley   PetscFunctionBegin;
78241c8de11SBarry Smith   if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with PaStiX LU, use AIJ matrix");
78341c8de11SBarry Smith 
7843bf14a46SMatthew Knepley   /* Create the factorization matrix */
7853bf14a46SMatthew Knepley   ierr = MatCreate(((PetscObject)A)->comm,&B);CHKERRQ(ierr);
7863bf14a46SMatthew Knepley   ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr);
7873bf14a46SMatthew Knepley   ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr);
7883bf14a46SMatthew Knepley   ierr = MatSeqSBAIJSetPreallocation(B,1,0,PETSC_NULL);CHKERRQ(ierr);
7893bf14a46SMatthew Knepley   ierr = MatMPISBAIJSetPreallocation(B,1,0,PETSC_NULL,0,PETSC_NULL);CHKERRQ(ierr);
7903bf14a46SMatthew Knepley 
7913bf14a46SMatthew Knepley   B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SBAIJPASTIX;
7923bf14a46SMatthew Knepley   B->ops->view                   = MatView_PaStiX;
7933bf14a46SMatthew Knepley   ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,
7943bf14a46SMatthew Knepley 					   "MatFactorGetSolverPackage_C",
7953bf14a46SMatthew Knepley 					   "MatFactorGetSolverPackage_pastix",
7963bf14a46SMatthew Knepley 					   MatFactorGetSolverPackage_pastix);CHKERRQ(ierr);
7973bf14a46SMatthew Knepley   B->factor                      = MAT_FACTOR_CHOLESKY;
7983bf14a46SMatthew Knepley 
7993bf14a46SMatthew Knepley   ierr = PetscNewLog(B,Mat_Pastix,&pastix);CHKERRQ(ierr);
8003bf14a46SMatthew Knepley   pastix->CleanUpPastix             = PETSC_FALSE;
8013bf14a46SMatthew Knepley   pastix->isAIJ                     = PETSC_TRUE;
8023bf14a46SMatthew Knepley   pastix->scat_rhs                  = PETSC_NULL;
8033bf14a46SMatthew Knepley   pastix->scat_sol                  = PETSC_NULL;
8043bf14a46SMatthew Knepley   pastix->nSolve                    = 0;
8053bf14a46SMatthew Knepley   pastix->MatDestroy                = B->ops->destroy;
8063bf14a46SMatthew Knepley   B->ops->destroy                   = MatDestroy_Pastix;
8073bf14a46SMatthew Knepley   B->spptr                          = (void*)pastix;
8083bf14a46SMatthew Knepley 
8093bf14a46SMatthew Knepley   *F = B;
8103bf14a46SMatthew Knepley   PetscFunctionReturn(0);
8113bf14a46SMatthew Knepley }
8123bf14a46SMatthew Knepley EXTERN_C_END
813