1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 11d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 12d71ae5a4SJacob Faibussowitsch { 134099cc6bSBarry Smith PetscBool flg; 144099cc6bSBarry Smith char type[256]; 154099cc6bSBarry Smith 164099cc6bSBarry Smith PetscFunctionBegin; 17d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 189566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 199566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 20d0609cedSBarry Smith PetscOptionsEnd(); 214099cc6bSBarry Smith PetscFunctionReturn(0); 224099cc6bSBarry Smith } 234099cc6bSBarry Smith 24d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 25d71ae5a4SJacob Faibussowitsch { 260716a85fSBarry Smith PetscInt i, m, n; 270716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 280716a85fSBarry Smith 290716a85fSBarry Smith PetscFunctionBegin; 309566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 319566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 320716a85fSBarry Smith if (type == NORM_2) { 33ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 340716a85fSBarry Smith } else if (type == NORM_1) { 35ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 360716a85fSBarry Smith } 
else if (type == NORM_INFINITY) { 37ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 38857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 39ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 40857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 42857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 430716a85fSBarry Smith 440716a85fSBarry Smith if (type == NORM_2) { 45a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 47a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 480716a85fSBarry Smith } 490716a85fSBarry Smith PetscFunctionReturn(0); 500716a85fSBarry Smith } 510716a85fSBarry Smith 52d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 53d71ae5a4SJacob Faibussowitsch { 543a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 553a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 563a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 573a062f41SBarry Smith PetscInt *rows; 583a062f41SBarry Smith 593a062f41SBarry Smith PetscFunctionBegin; 603a062f41SBarry Smith for (i = 0; i < m; i++) { 61ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 623a062f41SBarry Smith } 639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 643a062f41SBarry Smith cnt = 0; 653a062f41SBarry Smith for (i = 0; i 
< m; i++) { 663a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 673a062f41SBarry Smith rows[cnt] = i; 683a062f41SBarry Smith cnt++; 693a062f41SBarry Smith } 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 723a062f41SBarry Smith PetscFunctionReturn(0); 733a062f41SBarry Smith } 743a062f41SBarry Smith 75d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 76d71ae5a4SJacob Faibussowitsch { 776ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 78fff043a9SJunchao Zhang const MatScalar *aa; 796ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 80b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 816ce1633cSBarry Smith PetscInt *rows; 826ce1633cSBarry Smith 836ce1633cSBarry Smith PetscFunctionBegin; 849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 859566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 866ce1633cSBarry Smith diag = a->diag; 876ce1633cSBarry Smith for (i = 0; i < m; i++) { 88ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 896ce1633cSBarry Smith } 909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 916ce1633cSBarry Smith cnt = 0; 926ce1633cSBarry Smith for (i = 0; i < m; i++) { 93ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 946ce1633cSBarry Smith } 95f1f41ecbSJed Brown *nrows = cnt; 96f1f41ecbSJed Brown *zrows = rows; 979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 98f1f41ecbSJed Brown PetscFunctionReturn(0); 99f1f41ecbSJed Brown } 100f1f41ecbSJed Brown 101d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 102d71ae5a4SJacob Faibussowitsch { 
103f1f41ecbSJed Brown PetscInt nrows, *rows; 104f1f41ecbSJed Brown 105f1f41ecbSJed Brown PetscFunctionBegin; 1060298fd71SBarry Smith *zrows = NULL; 1079566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1089566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1096ce1633cSBarry Smith PetscFunctionReturn(0); 1106ce1633cSBarry Smith } 1116ce1633cSBarry Smith 112d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 113d71ae5a4SJacob Faibussowitsch { 114b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115b3a44c85SBarry Smith const MatScalar *aa; 116b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 117b3a44c85SBarry Smith const PetscInt *ii; 118b3a44c85SBarry Smith PetscInt n, i, j, *rows; 119b3a44c85SBarry Smith 120b3a44c85SBarry Smith PetscFunctionBegin; 1219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 122f4259b30SLisandro Dalcin *keptrows = NULL; 123b3a44c85SBarry Smith ii = a->i; 124b3a44c85SBarry Smith for (i = 0; i < m; i++) { 125b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 126b3a44c85SBarry Smith if (!n) { 127b3a44c85SBarry Smith cnt++; 128b3a44c85SBarry Smith goto ok1; 129b3a44c85SBarry Smith } 1302e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 131b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 132b3a44c85SBarry Smith } 133b3a44c85SBarry Smith cnt++; 134b3a44c85SBarry Smith ok1:; 135b3a44c85SBarry Smith } 1362e5835c6SStefano Zampini if (!cnt) { 1379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1382e5835c6SStefano Zampini PetscFunctionReturn(0); 1392e5835c6SStefano Zampini } 1409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 141b3a44c85SBarry Smith cnt = 0; 142b3a44c85SBarry Smith for (i = 0; i < m; i++) { 143b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 144b3a44c85SBarry Smith if (!n) continue; 
1452e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 146b3a44c85SBarry Smith if (aa[j] != 0.0) { 147b3a44c85SBarry Smith rows[cnt++] = i; 148b3a44c85SBarry Smith break; 149b3a44c85SBarry Smith } 150b3a44c85SBarry Smith } 151b3a44c85SBarry Smith } 1529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1539566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 154b3a44c85SBarry Smith PetscFunctionReturn(0); 155b3a44c85SBarry Smith } 156b3a44c85SBarry Smith 157d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 158d71ae5a4SJacob Faibussowitsch { 15979299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16099e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16199e65526SBarry Smith const PetscInt *diag; 1622e5835c6SStefano Zampini MatScalar *aa; 16399e65526SBarry Smith const PetscScalar *v; 164ace3abfcSBarry Smith PetscBool missing; 16579299369SBarry Smith 16679299369SBarry Smith PetscFunctionBegin; 16709f38230SBarry Smith if (Y->assembled) { 1689566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 16909f38230SBarry Smith if (!missing) { 17079299369SBarry Smith diag = aij->diag; 1719566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 1729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 17379299369SBarry Smith if (is == INSERT_VALUES) { 174ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 17579299369SBarry Smith } else { 176ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 17779299369SBarry Smith } 1789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 18079299369SBarry Smith PetscFunctionReturn(0); 18179299369SBarry Smith } 1829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 18309f38230SBarry Smith } 
1849566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 18509f38230SBarry Smith PetscFunctionReturn(0); 18609f38230SBarry Smith } 18779299369SBarry Smith 188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 189d71ae5a4SJacob Faibussowitsch { 190416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19197f1f81fSBarry Smith PetscInt i, ishift; 19217ab2063SBarry Smith 1933a40ed3dSBarry Smith PetscFunctionBegin; 194f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 1953a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 196bfeeae90SHong Zhang ishift = 0; 197b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 1989566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 199bfeeae90SHong Zhang } else if (oshift == 1) { 2001a83f524SJed Brown PetscInt *tia; 201d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2023b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 2041a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2051a83f524SJed Brown *ia = tia; 206ecc77c7aSBarry Smith if (ja) { 2071a83f524SJed Brown PetscInt *tja; 2089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2091a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2101a83f524SJed Brown *ja = tja; 211ecc77c7aSBarry Smith } 2126945ee14SBarry Smith } else { 213ecc77c7aSBarry Smith *ia = a->i; 214ecc77c7aSBarry Smith if (ja) *ja = a->j; 215a2ce50c7SBarry Smith } 2163a40ed3dSBarry Smith PetscFunctionReturn(0); 217a2744918SBarry Smith } 218a2744918SBarry Smith 219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, 
PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 220d71ae5a4SJacob Faibussowitsch { 2213a40ed3dSBarry Smith PetscFunctionBegin; 2223a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 223b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2249566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2259566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 226bcd2baecSBarry Smith } 2273a40ed3dSBarry Smith PetscFunctionReturn(0); 22817ab2063SBarry Smith } 22917ab2063SBarry Smith 230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 231d71ae5a4SJacob Faibussowitsch { 2323b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 233d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 23497f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2353b2fbd54SBarry Smith 2363a40ed3dSBarry Smith PetscFunctionBegin; 237899cda47SBarry Smith *nn = n; 2383a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2393b2fbd54SBarry Smith if (symmetric) { 2409566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2413b2fbd54SBarry Smith } else { 2429566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2453b2fbd54SBarry Smith jj = a->j; 246ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2473b2fbd54SBarry Smith cia[0] = oshift; 248ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2499566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 
2503b2fbd54SBarry Smith jj = a->j; 251a93ec695SBarry Smith for (row = 0; row < m; row++) { 252a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 253a93ec695SBarry Smith for (i = 0; i < mr; i++) { 254bfeeae90SHong Zhang col = *jj++; 2552205254eSKarl Rupp 2563b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2573b2fbd54SBarry Smith } 2583b2fbd54SBarry Smith } 2599566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2609371c9d4SSatish Balay *ia = cia; 2619371c9d4SSatish Balay *ja = cja; 2623b2fbd54SBarry Smith } 2633a40ed3dSBarry Smith PetscFunctionReturn(0); 2643b2fbd54SBarry Smith } 2653b2fbd54SBarry Smith 266d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 267d71ae5a4SJacob Faibussowitsch { 2683a40ed3dSBarry Smith PetscFunctionBegin; 2693a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2703b2fbd54SBarry Smith 2719566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2729566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2733a40ed3dSBarry Smith PetscFunctionReturn(0); 2743b2fbd54SBarry Smith } 2753b2fbd54SBarry Smith 2767cee066cSHong Zhang /* 2777cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2787cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 279040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2807cee066cSHong Zhang */ 281d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 282d71ae5a4SJacob Faibussowitsch { 2837cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 
2847cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 285071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2867cee066cSHong Zhang PetscInt *cspidx; 287071fcb05SBarry Smith const PetscInt *jj; 2887cee066cSHong Zhang 2897cee066cSHong Zhang PetscFunctionBegin; 2907cee066cSHong Zhang *nn = n; 2917cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 292625f6d37SHong Zhang 2939566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 2977cee066cSHong Zhang jj = a->j; 298ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2997cee066cSHong Zhang cia[0] = oshift; 300ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3027cee066cSHong Zhang jj = a->j; 3037cee066cSHong Zhang for (row = 0; row < m; row++) { 3047cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3057cee066cSHong Zhang for (i = 0; i < mr; i++) { 3067cee066cSHong Zhang col = *jj++; 307071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 308071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 309071fcb05SBarry Smith cja[tmp] = row + oshift; 3107cee066cSHong Zhang } 3117cee066cSHong Zhang } 3129566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 313071fcb05SBarry Smith *ia = cia; 314071fcb05SBarry Smith *ja = cja; 3157cee066cSHong Zhang *spidx = cspidx; 3167cee066cSHong Zhang PetscFunctionReturn(0); 3177cee066cSHong Zhang } 3187cee066cSHong Zhang 319d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool 
*done) 320d71ae5a4SJacob Faibussowitsch { 3217cee066cSHong Zhang PetscFunctionBegin; 3229566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3239566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3247cee066cSHong Zhang PetscFunctionReturn(0); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 328d71ae5a4SJacob Faibussowitsch { 32987d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33087d4246cSBarry Smith PetscInt *ai = a->i; 331fff043a9SJunchao Zhang PetscScalar *aa; 33287d4246cSBarry Smith 33387d4246cSBarry Smith PetscFunctionBegin; 3349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 33787d4246cSBarry Smith PetscFunctionReturn(0); 33887d4246cSBarry Smith } 33987d4246cSBarry Smith 340bd04181cSBarry Smith /* 341bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 342bd04181cSBarry Smith 343bd04181cSBarry Smith - a single row of values is set with each call 344bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 345bd04181cSBarry Smith - the values are always added to the matrix, not set 346bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 347bd04181cSBarry Smith 3481f763a69SBarry Smith This does NOT assume the global column indices are sorted 349bd04181cSBarry Smith 3501f763a69SBarry Smith */ 351bd04181cSBarry Smith 352af0996ceSBarry Smith #include <petsc/private/isimpl.h> 353d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 354d71ae5a4SJacob Faibussowitsch { 355189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3561f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3571f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3581f763a69SBarry Smith PetscInt lastcol = -1; 359fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 360189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 361189e4007SBarry Smith 362fff043a9SJunchao Zhang PetscFunctionBegin; 3639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 364f38dd0b8SBarry Smith row = ridx[im[0]]; 3651f763a69SBarry Smith rp = aj + ai[row]; 3661f763a69SBarry Smith ap = aa + ai[row]; 3671f763a69SBarry Smith nrow = ailen[row]; 368189e4007SBarry Smith low = 0; 369189e4007SBarry Smith high = nrow; 370189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 371189e4007SBarry Smith col = cidx[in[l]]; 372f38dd0b8SBarry Smith value = v[l]; 373189e4007SBarry Smith 374189e4007SBarry Smith if (col <= lastcol) low = 0; 375189e4007SBarry Smith else high = nrow; 376189e4007SBarry Smith lastcol = col; 377189e4007SBarry Smith while (high - low > 5) { 378189e4007SBarry Smith t = (low + high) / 2; 379189e4007SBarry Smith if (rp[t] > col) high = t; 380189e4007SBarry Smith else low = t; 381189e4007SBarry Smith } 382189e4007SBarry Smith for (i = low; i < high; i++) { 383189e4007SBarry Smith if (rp[i] == col) { 3841f763a69SBarry Smith ap[i] += value; 385189e4007SBarry Smith low = i + 1; 3861f763a69SBarry Smith break; 387189e4007SBarry Smith } 388189e4007SBarry Smith } 389189e4007SBarry Smith } 3909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 391f38dd0b8SBarry Smith return 0; 392189e4007SBarry Smith } 393189e4007SBarry Smith 394d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 395d71ae5a4SJacob Faibussowitsch { 396416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 397e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 39897f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 399e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 400ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 401ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 402ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 40317ab2063SBarry Smith 4043a40ed3dSBarry Smith PetscFunctionBegin; 4059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 40617ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 407416022c9SBarry Smith row = im[k]; 4085ef9f2a5SBarry Smith if (row < 0) continue; 4096bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 410720833daSHong Zhang rp = aj + ai[row]; 411876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 4129371c9d4SSatish Balay rmax = imax[row]; 4139371c9d4SSatish Balay nrow = ailen[row]; 414416022c9SBarry Smith low = 0; 415c71e6ed7SBarry Smith high = nrow; 41617ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4175ef9f2a5SBarry Smith if (in[l] < 0) continue; 4186bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 419bfeeae90SHong Zhang col = in[l]; 420071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? 
v[l + k * n] : v[k + l * m]; 421071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 42236db0b34SBarry Smith 4232205254eSKarl Rupp if (col <= lastcol) low = 0; 4242205254eSKarl Rupp else high = nrow; 425e2ee6c50SBarry Smith lastcol = col; 426416022c9SBarry Smith while (high - low > 5) { 427416022c9SBarry Smith t = (low + high) / 2; 428416022c9SBarry Smith if (rp[t] > col) high = t; 429416022c9SBarry Smith else low = t; 43017ab2063SBarry Smith } 431416022c9SBarry Smith for (i = low; i < high; i++) { 43217ab2063SBarry Smith if (rp[i] > col) break; 43317ab2063SBarry Smith if (rp[i] == col) { 434876c6284SHong Zhang if (!A->structure_only) { 4350c0d7e18SFande Kong if (is == ADD_VALUES) { 4360c0d7e18SFande Kong ap[i] += value; 4370c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4389371c9d4SSatish Balay } else ap[i] = value; 439720833daSHong Zhang } 440e44c0bd4SBarry Smith low = i + 1; 44117ab2063SBarry Smith goto noinsert; 44217ab2063SBarry Smith } 44317ab2063SBarry Smith } 444dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 445c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 44608401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 447720833daSHong Zhang if (A->structure_only) { 448876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 449720833daSHong Zhang } else { 450fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 451720833daSHong Zhang } 4529371c9d4SSatish Balay N = nrow++ - 1; 4539371c9d4SSatish Balay a->nz++; 4549371c9d4SSatish Balay high++; 455416022c9SBarry Smith /* shift up all the later entries in this row */ 4569566063dSJacob Faibussowitsch 
PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 45717ab2063SBarry Smith rp[i] = col; 458580bdb30SBarry Smith if (!A->structure_only) { 4599566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 460580bdb30SBarry Smith ap[i] = value; 461580bdb30SBarry Smith } 462416022c9SBarry Smith low = i + 1; 463e56f5c9eSBarry Smith A->nonzerostate++; 464e44c0bd4SBarry Smith noinsert:; 46517ab2063SBarry Smith } 46617ab2063SBarry Smith ailen[row] = nrow; 46717ab2063SBarry Smith } 4689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4693a40ed3dSBarry Smith PetscFunctionReturn(0); 47017ab2063SBarry Smith } 47117ab2063SBarry Smith 472d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 473d71ae5a4SJacob Faibussowitsch { 47419b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 47519b08ed1SBarry Smith PetscInt *rp, k, row; 47619b08ed1SBarry Smith PetscInt *ai = a->i; 47719b08ed1SBarry Smith PetscInt *aj = a->j; 478fff043a9SJunchao Zhang MatScalar *aa, *ap; 47919b08ed1SBarry Smith 48019b08ed1SBarry Smith PetscFunctionBegin; 48128b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48208401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 483fff043a9SJunchao Zhang 4849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 48519b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 48619b08ed1SBarry Smith row = im[k]; 48719b08ed1SBarry Smith rp = aj + ai[row]; 48819b08ed1SBarry Smith ap = aa + ai[row]; 48919b08ed1SBarry Smith 4909566063dSJacob Faibussowitsch 
PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49119b08ed1SBarry Smith if (!A->structure_only) { 49219b08ed1SBarry Smith if (v) { 4939566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 49419b08ed1SBarry Smith v += n; 49519b08ed1SBarry Smith } else { 4969566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 49719b08ed1SBarry Smith } 49819b08ed1SBarry Smith } 49919b08ed1SBarry Smith a->ilen[row] = n; 50019b08ed1SBarry Smith a->imax[row] = n; 50119b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50219b08ed1SBarry Smith a->nz += n; 50319b08ed1SBarry Smith } 5049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 50519b08ed1SBarry Smith PetscFunctionReturn(0); 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith 50819b08ed1SBarry Smith /*@ 50919b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 51019b08ed1SBarry Smith 51119b08ed1SBarry Smith Input Parameters: 51211a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 51319b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith Level: advanced 51619b08ed1SBarry Smith 51719b08ed1SBarry Smith Notes: 51819b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 51911a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52019b08ed1SBarry Smith as always with multiple matrix assemblies. 
52119b08ed1SBarry Smith 522db781477SPatrick Sanan .seealso: `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 52319b08ed1SBarry Smith @*/ 52419b08ed1SBarry Smith 525d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 526d71ae5a4SJacob Faibussowitsch { 52719b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 52819b08ed1SBarry Smith 52919b08ed1SBarry Smith PetscFunctionBegin; 5309566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5319566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53219b08ed1SBarry Smith a->maxnz = nztotal; 5334dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 53419b08ed1SBarry Smith if (!a->ilen) { 5359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 53619b08ed1SBarry Smith } else { 5379566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 53819b08ed1SBarry Smith } 53919b08ed1SBarry Smith 54019b08ed1SBarry Smith /* allocate the matrix space */ 54119b08ed1SBarry Smith if (A->structure_only) { 5429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 54419b08ed1SBarry Smith } else { 5459566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 54619b08ed1SBarry Smith } 54719b08ed1SBarry Smith a->i[0] = 0; 54819b08ed1SBarry Smith if (A->structure_only) { 54919b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55019b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55119b08ed1SBarry Smith } else { 55219b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 55319b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55419b08ed1SBarry Smith } 55519b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 55619b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55719b08ed1SBarry Smith 
A->preallocated = PETSC_TRUE; 55819b08ed1SBarry Smith PetscFunctionReturn(0); 55919b08ed1SBarry Smith } 56019b08ed1SBarry Smith 561d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 562d71ae5a4SJacob Faibussowitsch { 563071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 564071fcb05SBarry Smith PetscInt *rp, k, row; 565071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 566071fcb05SBarry Smith PetscInt *aj = a->j; 567fff043a9SJunchao Zhang MatScalar *aa, *ap; 568071fcb05SBarry Smith 569071fcb05SBarry Smith PetscFunctionBegin; 5709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 571071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 572071fcb05SBarry Smith row = im[k]; 5736bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 574071fcb05SBarry Smith rp = aj + ai[row]; 575071fcb05SBarry Smith ap = aa + ai[row]; 57648a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 577071fcb05SBarry Smith if (!A->structure_only) { 578071fcb05SBarry Smith if (v) { 5799566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 580071fcb05SBarry Smith v += n; 581071fcb05SBarry Smith } else { 5829566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 583071fcb05SBarry Smith } 584071fcb05SBarry Smith } 585071fcb05SBarry Smith ailen[row] = n; 586071fcb05SBarry Smith a->nz += n; 587071fcb05SBarry Smith } 5889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 589071fcb05SBarry Smith PetscFunctionReturn(0); 590071fcb05SBarry Smith } 591071fcb05SBarry Smith 592d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], 
PetscInt n, const PetscInt in[], PetscScalar v[]) 593d71ae5a4SJacob Faibussowitsch { 5947eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59597f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59697f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 597fff043a9SJunchao Zhang MatScalar *ap, *aa; 5987eb43aa7SLois Curfman McInnes 5993a40ed3dSBarry Smith PetscFunctionBegin; 6009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 6017eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6027eb43aa7SLois Curfman McInnes row = im[k]; 6039371c9d4SSatish Balay if (row < 0) { 6049371c9d4SSatish Balay v += n; 6059371c9d4SSatish Balay continue; 6069371c9d4SSatish Balay } /* negative row */ 60754c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6089371c9d4SSatish Balay rp = aj + ai[row]; 6099371c9d4SSatish Balay ap = aa + ai[row]; 6107eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6117eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6129371c9d4SSatish Balay if (in[l] < 0) { 6139371c9d4SSatish Balay v++; 6149371c9d4SSatish Balay continue; 6159371c9d4SSatish Balay } /* negative column */ 61654c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 617bfeeae90SHong Zhang col = in[l]; 6189371c9d4SSatish Balay high = nrow; 6199371c9d4SSatish Balay low = 0; /* assume unsorted */ 6207eb43aa7SLois Curfman McInnes while (high - low > 5) { 6217eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6227eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6237eb43aa7SLois Curfman McInnes else low = t; 6247eb43aa7SLois Curfman McInnes } 6257eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 
6267eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6277eb43aa7SLois Curfman McInnes if (rp[i] == col) { 628b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6297eb43aa7SLois Curfman McInnes goto finished; 6307eb43aa7SLois Curfman McInnes } 6317eb43aa7SLois Curfman McInnes } 63297e567efSBarry Smith *v++ = 0.0; 6337eb43aa7SLois Curfman McInnes finished:; 6347eb43aa7SLois Curfman McInnes } 6357eb43aa7SLois Curfman McInnes } 6369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 6373a40ed3dSBarry Smith PetscFunctionReturn(0); 6387eb43aa7SLois Curfman McInnes } 6397eb43aa7SLois Curfman McInnes 640d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 641d71ae5a4SJacob Faibussowitsch { 6423ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 643c898d852SStefano Zampini const PetscScalar *av; 6443ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6453ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64617ab2063SBarry Smith 6473a40ed3dSBarry Smith PetscFunctionBegin; 6489566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6492205254eSKarl Rupp 6503ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6513ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6523ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6533ea6fe3dSLisandro Dalcin nz = A->nz; 654416022c9SBarry Smith 6553ea6fe3dSLisandro Dalcin /* write matrix header */ 6563ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6579371c9d4SSatish Balay header[1] = M; 6589371c9d4SSatish Balay header[2] = N; 6599371c9d4SSatish Balay header[3] = nz; 6609566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 661416022c9SBarry Smith 6623ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6643ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6659566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, 
rowlens, m, PETSC_INT)); 6669566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6673ea6fe3dSLisandro Dalcin /* store column indices */ 6689566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 669416022c9SBarry Smith /* store nonzero values */ 6709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6719566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 673b37d52dbSMark F. Adams 6743ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6759566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6763a40ed3dSBarry Smith PetscFunctionReturn(0); 67717ab2063SBarry Smith } 678416022c9SBarry Smith 679d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 680d71ae5a4SJacob Faibussowitsch { 6817dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6827dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6837dc0baabSHong Zhang 6847dc0baabSHong Zhang PetscFunctionBegin; 6859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6867dc0baabSHong Zhang for (i = 0; i < m; i++) { 6879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 68848a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6907dc0baabSHong Zhang } 6919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6927dc0baabSHong Zhang PetscFunctionReturn(0); 6937dc0baabSHong Zhang } 6947dc0baabSHong Zhang 69509573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 696cd155464SBarry Smith 697d71ae5a4SJacob Faibussowitsch 
PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 698d71ae5a4SJacob Faibussowitsch { 699416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 700c898d852SStefano Zampini const PetscScalar *av; 70160e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 702e060cb09SBarry Smith const char *name; 703f3ef73ceSBarry Smith PetscViewerFormat format; 70417ab2063SBarry Smith 7053a40ed3dSBarry Smith PetscFunctionBegin; 7067dc0baabSHong Zhang if (A->structure_only) { 7079566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7087dc0baabSHong Zhang PetscFunctionReturn(0); 7097dc0baabSHong Zhang } 71043e49210SHong Zhang 7119566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7122e5835c6SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 7132e5835c6SStefano Zampini 714c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 71771c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 71897f1f81fSBarry Smith PetscInt nofinalvalue = 0; 71960e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 720c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 721d00d2cf4SBarry Smith nofinalvalue = 1; 722d00d2cf4SBarry Smith } 7239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 726fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 728fbfe6fa7SJed Brown #else 7299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 730fbfe6fa7SJed Brown #endif 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73217ab2063SBarry Smith 73317ab2063SBarry Smith for (i = 0; i < m; i++) { 73460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 735aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 73717ab2063SBarry Smith #else 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 73917ab2063SBarry Smith #endif 74017ab2063SBarry Smith } 74117ab2063SBarry Smith } 742d00d2cf4SBarry Smith if (nofinalvalue) { 743c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 745c337ccceSJed Brown #else 7469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 747c337ccceSJed Brown #endif 748d00d2cf4SBarry Smith } 7499566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 752fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 75444cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 75660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 757aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 75836db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76036db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76236db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7646831982aSBarry Smith } 76544cd7ae7SLois Curfman McInnes #else 7669566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 76744cd7ae7SLois Curfman McInnes #endif 76844cd7ae7SLois Curfman McInnes } 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77044cd7ae7SLois 
Curfman McInnes } 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 772fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 77397f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 776496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 777496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 77860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 779496be53dSLois Curfman McInnes if (a->j[j] >= i) { 780aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78136db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 782496be53dSLois Curfman McInnes #else 783496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 784496be53dSLois Curfman McInnes #endif 785496be53dSLois Curfman McInnes } 786496be53dSLois Curfman McInnes } 787496be53dSLois Curfman McInnes } 7882e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7902e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7912205254eSKarl Rupp if (i + 4 < m) { 7929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 7932205254eSKarl Rupp } else if (i + 3 < m) { 7949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 7952205254eSKarl Rupp } else if (i + 2 < m) { 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 7972205254eSKarl Rupp } else if (i + 1 < m) { 7989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 7992205254eSKarl Rupp } else if (i < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8012205254eSKarl Rupp } else { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8032205254eSKarl Rupp } 804496be53dSLois Curfman McInnes } 8059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8069566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 807496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 80860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8099566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 810496be53dSLois Curfman McInnes } 8119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 812496be53dSLois Curfman McInnes } 8139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 814496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 816496be53dSLois Curfman McInnes if (a->j[j] >= i) { 817aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 81848a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 819496be53dSLois Curfman McInnes #else 8209566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
821496be53dSLois Curfman McInnes #endif 822496be53dSLois Curfman McInnes } 823496be53dSLois Curfman McInnes } 8249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 825496be53dSLois Curfman McInnes } 8269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 827fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 82897f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 82987828ca2SBarry Smith PetscScalar value; 83068f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83168f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83268f1ed48SBarry Smith 83368f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 83468f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 83568f1ed48SBarry Smith realonly = PETSC_FALSE; 83668f1ed48SBarry Smith break; 83768f1ed48SBarry Smith } 83868f1ed48SBarry Smith } 83968f1ed48SBarry Smith #endif 84002594712SBarry Smith 8419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84202594712SBarry Smith for (i = 0; i < m; i++) { 84302594712SBarry Smith jcnt = 0; 844d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 845e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 84602594712SBarry Smith value = a->a[cnt++]; 847e24b481bSBarry Smith jcnt++; 84802594712SBarry Smith } else { 84902594712SBarry Smith value = 0.0; 85002594712SBarry Smith } 851aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85268f1ed48SBarry Smith if (realonly) { 8539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 85468f1ed48SBarry Smith } else { 8559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 85668f1ed48SBarry Smith } 85702594712SBarry Smith #else 8589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 85902594712SBarry Smith 
#endif 86002594712SBarry Smith } 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86202594712SBarry Smith } 8639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8643c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 865150b93efSMatthew G. Knepley PetscInt fshift = 1; 8669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8673c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8693c215bfdSMatthew Knepley #else 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8713c215bfdSMatthew Knepley #endif 8729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8733c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 87460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8773c215bfdSMatthew Knepley #else 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8793c215bfdSMatthew Knepley #endif 8803c215bfdSMatthew Knepley } 8813c215bfdSMatthew Knepley } 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8833a40ed3dSBarry Smith } else { 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 885d5f3da31SBarry Smith if (A->factortype) { 88616cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 88816cd7e1dSShri Abhyankar /* L part */ 88960e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 89316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 89516cd7e1dSShri Abhyankar } else { 8969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 89716cd7e1dSShri Abhyankar } 89816cd7e1dSShri Abhyankar #else 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90016cd7e1dSShri Abhyankar #endif 90116cd7e1dSShri Abhyankar } 90216cd7e1dSShri Abhyankar /* diagonal */ 90316cd7e1dSShri Abhyankar j = a->diag[i]; 90416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 90516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 90716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 90916cd7e1dSShri Abhyankar } else { 9109566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91116cd7e1dSShri Abhyankar } 91216cd7e1dSShri Abhyankar #else 9139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 91416cd7e1dSShri Abhyankar #endif 91516cd7e1dSShri Abhyankar 91616cd7e1dSShri Abhyankar /* U part */ 91760e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 91816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 92316cd7e1dSShri Abhyankar } else { 9249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 92516cd7e1dSShri Abhyankar } 92616cd7e1dSShri Abhyankar #else 9279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 92816cd7e1dSShri Abhyankar #endif 92916cd7e1dSShri Abhyankar } 9309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93116cd7e1dSShri Abhyankar } 93216cd7e1dSShri Abhyankar } else { 93317ab2063SBarry Smith for (i = 0; i < m; i++) { 9349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 93560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 936aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 93736db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 93936db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9413a40ed3dSBarry Smith } else { 9429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 94317ab2063SBarry Smith } 94417ab2063SBarry Smith #else 9459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 94617ab2063SBarry Smith #endif 94717ab2063SBarry Smith } 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 94917ab2063SBarry Smith } 95016cd7e1dSShri Abhyankar } 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95217ab2063SBarry Smith } 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9543a40ed3dSBarry Smith PetscFunctionReturn(0); 955416022c9SBarry Smith } 956416022c9SBarry Smith 9579804daf3SBarry Smith #include <petscdraw.h> 958d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 959d71ae5a4SJacob Faibussowitsch { 960480ef9eaSBarry Smith Mat A = (Mat)Aa; 961416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 962383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 963383922c3SLisandro Dalcin int color; 964b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 965b0a32e0cSBarry Smith PetscViewer viewer; 966f3ef73ceSBarry Smith PetscViewerFormat format; 967fff043a9SJunchao Zhang const PetscScalar *aa; 968cddf8d76SBarry Smith 9693a40ed3dSBarry Smith PetscFunctionBegin; 
9709566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9719566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9729566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 973383922c3SLisandro Dalcin 974416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 976fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 977d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9780513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 979b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 980416022c9SBarry Smith for (i = 0; i < m; i++) { 9819371c9d4SSatish Balay y_l = m - i - 1.0; 9829371c9d4SSatish Balay y_r = y_l + 1.0; 983bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9849371c9d4SSatish Balay x_l = a->j[j]; 9859371c9d4SSatish Balay x_r = x_l + 1.0; 986fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9879566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 988cddf8d76SBarry Smith } 989cddf8d76SBarry Smith } 990b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 991cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9929371c9d4SSatish Balay y_l = m - i - 1.0; 9939371c9d4SSatish Balay y_r = y_l + 1.0; 994bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9959371c9d4SSatish Balay x_l = a->j[j]; 9969371c9d4SSatish Balay x_r = x_l + 1.0; 997fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 9989566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 999cddf8d76SBarry Smith } 1000cddf8d76SBarry Smith } 1001b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1002cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10039371c9d4SSatish Balay y_l = m - i - 1.0; 10049371c9d4SSatish Balay y_r = y_l + 1.0; 1005bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10069371c9d4SSatish Balay x_l = a->j[j]; 10079371c9d4SSatish Balay x_r = x_l + 1.0; 1008fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10099566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1010416022c9SBarry Smith } 1011416022c9SBarry Smith } 1012d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10130513a670SBarry Smith } else { 10140513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10150513a670SBarry Smith /* first determine max of all nonzero values */ 1016b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1017383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1018b0a32e0cSBarry Smith PetscDraw popup; 10190513a670SBarry Smith 10200513a670SBarry Smith for (i = 0; i < nz; i++) { 1021fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10220513a670SBarry Smith } 1023383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10249566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10259566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1026383922c3SLisandro Dalcin 1027d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10280513a670SBarry Smith for (i = 0; i < m; i++) { 1029383922c3SLisandro Dalcin y_l = m - i - 1.0; 1030383922c3SLisandro Dalcin y_r = y_l + 1.0; 1031bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1032383922c3SLisandro Dalcin x_l = a->j[j]; 1033383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1034fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10359566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10360513a670SBarry Smith count++; 10370513a670SBarry Smith } 10380513a670SBarry Smith } 1039d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10400513a670SBarry Smith } 10419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1042480ef9eaSBarry Smith PetscFunctionReturn(0); 1043480ef9eaSBarry Smith } 1044cddf8d76SBarry Smith 10459804daf3SBarry Smith #include <petscdraw.h> 1046d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1047d71ae5a4SJacob Faibussowitsch { 1048b0a32e0cSBarry Smith PetscDraw draw; 104936db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1050ace3abfcSBarry Smith PetscBool isnull; 1051480ef9eaSBarry Smith 1052480ef9eaSBarry Smith PetscFunctionBegin; 10539566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10549566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 1055480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1056480ef9eaSBarry Smith 10579371c9d4SSatish Balay xr = A->cmap->n; 10589371c9d4SSatish Balay yr = A->rmap->n; 10599371c9d4SSatish Balay h = yr / 10.0; 10609371c9d4SSatish Balay w = xr / 10.0; 10619371c9d4SSatish Balay xr += w; 10629371c9d4SSatish Balay yr += h; 10639371c9d4SSatish Balay xl = -w; 10649371c9d4SSatish Balay yl = -h; 10659566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10669566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10679566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10689566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10699566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 
10703a40ed3dSBarry Smith PetscFunctionReturn(0); 1071416022c9SBarry Smith } 1072416022c9SBarry Smith 1073d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1074d71ae5a4SJacob Faibussowitsch { 1075ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1076416022c9SBarry Smith 10773a40ed3dSBarry Smith PetscFunctionBegin; 10789566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10799566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10809566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10811baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10821baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10831baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10849566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10853a40ed3dSBarry Smith PetscFunctionReturn(0); 108617ab2063SBarry Smith } 108719bcc07fSBarry Smith 1088d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1089d71ae5a4SJacob Faibussowitsch { 1090416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1091580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1092d0f46423SBarry Smith PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0; 109354f21887SBarry Smith MatScalar *aa = a->a, *ap; 10943447b6efSHong Zhang PetscReal ratio = 0.6; 109517ab2063SBarry Smith 10963a40ed3dSBarry Smith PetscFunctionBegin; 10973a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 10989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1099b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1100b215bc84SStefano Zampini /* we need to respect 
users asking to use or not the inodes routine in between matrix assemblies */ 11019566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 1102b215bc84SStefano Zampini PetscFunctionReturn(0); 1103b215bc84SStefano Zampini } 110417ab2063SBarry Smith 110543ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 110617ab2063SBarry Smith for (i = 1; i < m; i++) { 1107416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 110817ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 110994a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111017ab2063SBarry Smith if (fshift) { 1111bfeeae90SHong Zhang ip = aj + ai[i]; 1112bfeeae90SHong Zhang ap = aa + ai[i]; 111317ab2063SBarry Smith N = ailen[i]; 11149566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 111548a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 111617ab2063SBarry Smith } 111717ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 111817ab2063SBarry Smith } 111917ab2063SBarry Smith if (m) { 112017ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112117ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112217ab2063SBarry Smith } 112317ab2063SBarry Smith /* reset ilen and imax for each row */ 11247b083b7cSBarry Smith a->nonzerorowcnt = 0; 1125396832f4SHong Zhang if (A->structure_only) { 11269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1128396832f4SHong Zhang } else { /* !A->structure_only */ 112917ab2063SBarry Smith for (i = 0; i < m; i++) { 113017ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11317b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113217ab2063SBarry Smith } 1133396832f4SHong Zhang } 1134bfeeae90SHong Zhang a->nz = ai[m]; 1135aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused 
space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 113617ab2063SBarry Smith 11379566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11389566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11399566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11409566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11412205254eSKarl Rupp 11428e58a170SBarry Smith A->info.mallocs += a->reallocs; 1143dd5f02e7SSatish Balay a->reallocs = 0; 11446712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 114536db0b34SBarry Smith a->rmax = rmax; 11464e220ebcSLois Curfman McInnes 114748a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11489566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11493a40ed3dSBarry Smith PetscFunctionReturn(0); 115017ab2063SBarry Smith } 115117ab2063SBarry Smith 1152d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1153d71ae5a4SJacob Faibussowitsch { 115499cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 115599cafbc1SBarry Smith PetscInt i, nz = a->nz; 11562e5835c6SStefano Zampini MatScalar *aa; 115799cafbc1SBarry Smith 115899cafbc1SBarry Smith PetscFunctionBegin; 11599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116099cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 116399cafbc1SBarry Smith PetscFunctionReturn(0); 116499cafbc1SBarry Smith } 
116599cafbc1SBarry Smith 1166d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1167d71ae5a4SJacob Faibussowitsch { 116899cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116999cafbc1SBarry Smith PetscInt i, nz = a->nz; 11702e5835c6SStefano Zampini MatScalar *aa; 117199cafbc1SBarry Smith 117299cafbc1SBarry Smith PetscFunctionBegin; 11739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117499cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 117799cafbc1SBarry Smith PetscFunctionReturn(0); 117899cafbc1SBarry Smith } 117999cafbc1SBarry Smith 1180d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1181d71ae5a4SJacob Faibussowitsch { 1182fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1183fff043a9SJunchao Zhang MatScalar *aa; 11843a40ed3dSBarry Smith 11853a40ed3dSBarry Smith PetscFunctionBegin; 11869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11879566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11903a40ed3dSBarry Smith PetscFunctionReturn(0); 119117ab2063SBarry Smith } 1192416022c9SBarry Smith 1193d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1194d71ae5a4SJacob Faibussowitsch { 1195cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1196cbc6b225SStefano Zampini 1197cbc6b225SStefano Zampini PetscFunctionBegin; 11989566063dSJacob Faibussowitsch PetscCall(PetscFree(a->perm)); 11999566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 1200cbc6b225SStefano Zampini PetscFunctionReturn(0); 1201cbc6b225SStefano Zampini } 
1202cbc6b225SStefano Zampini 1203d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1204d71ae5a4SJacob Faibussowitsch { 1205416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1206d5d45c9bSBarry Smith 12073a40ed3dSBarry Smith PetscFunctionBegin; 1208aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1209c0aa6a63SJacob Faibussowitsch PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz); 121017ab2063SBarry Smith #endif 12119566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12129566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12139566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12149566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12159566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12169566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12179566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12189566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12199566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12209566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12219566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12229566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12259566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1227901853e0SKris Buschelman 12286718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 
12296718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12306718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12316718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12326718818eSStefano Zampini due to different matrix sizes */ 12339566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12346718818eSStefano Zampini 12359566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12362e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12372e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12389566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12442e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12452e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12462e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12472e956fe4SStefano Zampini #endif 12484222ddf1SHong 
Zhang #if defined(PETSC_HAVE_CUDA) 12499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12524222ddf1SHong Zhang #endif 12533d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12553d0639e7SStefano Zampini #endif 12569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1257af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1259af8000cdSHong Zhang #endif 1260d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1262d24d4204SJose E. 
Roman #endif 126363c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 126663c07aadSStefano Zampini #endif 12679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12712e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12729566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12822e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12832e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12842e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12852e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12862e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 12872e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 12882e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 12893a40ed3dSBarry Smith PetscFunctionReturn(0); 129017ab2063SBarry Smith } 129117ab2063SBarry Smith 1292d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1293d71ae5a4SJacob Faibussowitsch { 1294416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 12953a40ed3dSBarry Smith 12963a40ed3dSBarry Smith PetscFunctionBegin; 1297a65d3064SKris Buschelman switch (op) { 1298d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1299d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1300d71ae5a4SJacob Faibussowitsch break; 1301d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1302d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1303d71ae5a4SJacob Faibussowitsch break; 1304d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1305d71ae5a4SJacob Faibussowitsch 
a->nonew = (flg ? 0 : 1); 1306d71ae5a4SJacob Faibussowitsch break; 1307d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1308d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1309d71ae5a4SJacob Faibussowitsch break; 1310d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1311d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1312d71ae5a4SJacob Faibussowitsch break; 1313d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1314d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1315d71ae5a4SJacob Faibussowitsch break; 1316d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1317d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1318d71ae5a4SJacob Faibussowitsch break; 13193d472b54SHong Zhang case MAT_SPD: 1320b1646e73SJed Brown case MAT_SYMMETRIC: 1321b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1322b1646e73SJed Brown case MAT_HERMITIAN: 1323b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1324957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1325b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1326b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1327b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13285021d80fSJed Brown break; 13298c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1330a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1331d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1332d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1333d71ae5a4SJacob Faibussowitsch break; 1334d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1335d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1336d71ae5a4SJacob Faibussowitsch break; 1337d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1338d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1339d71ae5a4SJacob Faibussowitsch break; 1340071fcb05SBarry Smith case MAT_SORTED_FULL: 
1341071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1342071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1343071fcb05SBarry Smith break; 1344d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1345d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1346d71ae5a4SJacob Faibussowitsch break; 1347d71ae5a4SJacob Faibussowitsch default: 1348d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1349a65d3064SKris Buschelman } 13503a40ed3dSBarry Smith PetscFunctionReturn(0); 135117ab2063SBarry Smith } 135217ab2063SBarry Smith 1353d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1354d71ae5a4SJacob Faibussowitsch { 1355416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1356fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1357c898d852SStefano Zampini PetscScalar *x; 1358c898d852SStefano Zampini const PetscScalar *aa; 135917ab2063SBarry Smith 13603a40ed3dSBarry Smith PetscFunctionBegin; 13619566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 136208401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1364d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1365d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13669566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13672c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13689566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 137035e7444dSHong Zhang PetscFunctionReturn(0); 137135e7444dSHong Zhang } 137235e7444dSHong Zhang 13739566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 137435e7444dSHong Zhang for (i = 0; i < n; i++) { 
1375fdc842d1SBarry Smith x[i] = 0.0; 137635e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 137735e7444dSHong Zhang if (aj[j] == i) { 137835e7444dSHong Zhang x[i] = aa[j]; 137917ab2063SBarry Smith break; 138017ab2063SBarry Smith } 138117ab2063SBarry Smith } 138217ab2063SBarry Smith } 13839566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13853a40ed3dSBarry Smith PetscFunctionReturn(0); 138617ab2063SBarry Smith } 138717ab2063SBarry Smith 1388c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1389d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1390d71ae5a4SJacob Faibussowitsch { 1391416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13925f22a7b3SSebastian Grimberg const MatScalar *aa; 1393d9ca1df4SBarry Smith PetscScalar *y; 1394d9ca1df4SBarry Smith const PetscScalar *x; 1395d0f46423SBarry Smith PetscInt m = A->rmap->n; 13965c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 13975f22a7b3SSebastian Grimberg const MatScalar *v; 1398a77337e4SBarry Smith PetscScalar alpha; 1399d9ca1df4SBarry Smith PetscInt n, i, j; 1400d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14013447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1402ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14035c897100SBarry Smith #endif 140417ab2063SBarry Smith 14053a40ed3dSBarry Smith PetscFunctionBegin; 14069566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14079566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14089566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14105c897100SBarry Smith 14115c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1412fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, 
a->j, aa, y); 14135c897100SBarry Smith #else 14143447b6efSHong Zhang if (usecprow) { 14153447b6efSHong Zhang m = cprow.nrows; 14163447b6efSHong Zhang ii = cprow.i; 14177b2bb3b9SHong Zhang ridx = cprow.rindex; 14183447b6efSHong Zhang } else { 14193447b6efSHong Zhang ii = a->i; 14203447b6efSHong Zhang } 142117ab2063SBarry Smith for (i = 0; i < m; i++) { 14223447b6efSHong Zhang idx = a->j + ii[i]; 1423fff043a9SJunchao Zhang v = aa + ii[i]; 14243447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14253447b6efSHong Zhang if (usecprow) { 14267b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14273447b6efSHong Zhang } else { 142817ab2063SBarry Smith alpha = x[i]; 14293447b6efSHong Zhang } 143004fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 143117ab2063SBarry Smith } 14325c897100SBarry Smith #endif 14339566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14349566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14359566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14373a40ed3dSBarry Smith PetscFunctionReturn(0); 143817ab2063SBarry Smith } 143917ab2063SBarry Smith 1440d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1441d71ae5a4SJacob Faibussowitsch { 14425c897100SBarry Smith PetscFunctionBegin; 14439566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14449566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14455c897100SBarry Smith PetscFunctionReturn(0); 14465c897100SBarry Smith } 14475c897100SBarry Smith 1448c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 144978b84d54SShri Abhyankar 1450d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1451d71ae5a4SJacob Faibussowitsch { 1452416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1453d9fead3dSBarry Smith PetscScalar *y; 145454f21887SBarry Smith const 
PetscScalar *x; 1455fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1456003131ecSBarry Smith PetscInt m = A->rmap->n; 14570298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14587b083b7cSBarry Smith PetscInt n, i; 1459362ced78SSatish Balay PetscScalar sum; 1460ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 146117ab2063SBarry Smith 1462b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 146397952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1464fee21e36SBarry Smith #endif 1465fee21e36SBarry Smith 14663a40ed3dSBarry Smith PetscFunctionBegin; 1467b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14689566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 1469b215bc84SStefano Zampini PetscFunctionReturn(0); 1470b215bc84SStefano Zampini } 14719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14729566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14739566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1474416022c9SBarry Smith ii = a->i; 14754eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14769566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 147797952fefSHong Zhang m = a->compressedrow.nrows; 147897952fefSHong Zhang ii = a->compressedrow.i; 147997952fefSHong Zhang ridx = a->compressedrow.rindex; 148097952fefSHong Zhang for (i = 0; i < m; i++) { 148197952fefSHong Zhang n = ii[i + 1] - ii[i]; 148297952fefSHong Zhang aj = a->j + ii[i]; 1483fff043a9SJunchao Zhang aa = a_a + ii[i]; 148497952fefSHong Zhang sum = 0.0; 1485003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1486003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 148797952fefSHong Zhang y[*ridx++] = sum; 148897952fefSHong Zhang } 148997952fefSHong Zhang } else { /* do not use compressed row format */ 1490b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 14913d3eaba7SBarry Smith aj = a->j; 1492fff043a9SJunchao Zhang aa 
= a_a; 1493b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1494b05257ddSBarry Smith #else 149517ab2063SBarry Smith for (i = 0; i < m; i++) { 1496003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1497003131ecSBarry Smith aj = a->j + ii[i]; 1498fff043a9SJunchao Zhang aa = a_a + ii[i]; 149917ab2063SBarry Smith sum = 0.0; 1500003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 150117ab2063SBarry Smith y[i] = sum; 150217ab2063SBarry Smith } 15038d195f9aSBarry Smith #endif 1504b05257ddSBarry Smith } 15059566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15069566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15079566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15093a40ed3dSBarry Smith PetscFunctionReturn(0); 151017ab2063SBarry Smith } 151117ab2063SBarry Smith 1512d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1513d71ae5a4SJacob Faibussowitsch { 1514b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1515b434eb95SMatthew G. Knepley PetscScalar *y; 1516b434eb95SMatthew G. Knepley const PetscScalar *x; 1517fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1518b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1519b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1520b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1521b434eb95SMatthew G. Knepley PetscScalar sum; 1522b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1523b434eb95SMatthew G. Knepley 1524b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1525b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1526b434eb95SMatthew G. Knepley #endif 1527b434eb95SMatthew G. Knepley 1528b434eb95SMatthew G. 
Knepley PetscFunctionBegin; 15299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15309566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15319566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1532b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1533b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1534b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1535b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1536b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1537b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1538b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1539fff043a9SJunchao Zhang aa = a_a + ii[i]; 1540b434eb95SMatthew G. Knepley sum = 0.0; 1541b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1542b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1543b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1544b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1545b434eb95SMatthew G. Knepley } 1546b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15473d3eaba7SBarry Smith ii = a->i; 1548b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1549b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1550b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1551fff043a9SJunchao Zhang aa = a_a + ii[i]; 1552b434eb95SMatthew G. Knepley sum = 0.0; 1553b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1554b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1555b434eb95SMatthew G. Knepley y[i] = sum; 1556b434eb95SMatthew G. Knepley } 1557b434eb95SMatthew G. Knepley } 15589566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15599566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15609566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1562b434eb95SMatthew G. 
Knepley PetscFunctionReturn(0); 1563b434eb95SMatthew G. Knepley } 1564b434eb95SMatthew G. Knepley 1565d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1566d71ae5a4SJacob Faibussowitsch { 1567b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1568b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1569b434eb95SMatthew G. Knepley const PetscScalar *x; 1570fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1571b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1572b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1573b434eb95SMatthew G. Knepley PetscScalar sum; 1574b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1575b434eb95SMatthew G. Knepley 1576b434eb95SMatthew G. Knepley PetscFunctionBegin; 15779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15789566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15799566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1580b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 158148a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1582b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1583b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1584b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1585b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1586b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1587b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1588fff043a9SJunchao Zhang aa = a_a + ii[i]; 1589b434eb95SMatthew G. Knepley sum = y[*ridx]; 1590b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1591b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1592b434eb95SMatthew G. Knepley } 1593b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15943d3eaba7SBarry Smith ii = a->i; 1595b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1596b434eb95SMatthew G. 
Knepley n = ii[i + 1] - ii[i]; 1597b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1598fff043a9SJunchao Zhang aa = a_a + ii[i]; 1599b434eb95SMatthew G. Knepley sum = y[i]; 1600b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1601b434eb95SMatthew G. Knepley z[i] = sum; 1602b434eb95SMatthew G. Knepley } 1603b434eb95SMatthew G. Knepley } 16049566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16059566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16069566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 1608b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1609b434eb95SMatthew G. Knepley } 1610b434eb95SMatthew G. Knepley 1611c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1612d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1613d71ae5a4SJacob Faibussowitsch { 1614416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1615f15663dcSBarry Smith PetscScalar *y, *z; 1616f15663dcSBarry Smith const PetscScalar *x; 1617fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1618d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1619d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1620362ced78SSatish Balay PetscScalar sum; 1621ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16229ea0dfa2SSatish Balay 16233a40ed3dSBarry Smith PetscFunctionBegin; 1624b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16259566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 1626b215bc84SStefano Zampini PetscFunctionReturn(0); 1627b215bc84SStefano Zampini } 16289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16299566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16309566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16314eb6d288SHong 
Zhang if (usecprow) { /* use compressed row format */ 163248a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 163397952fefSHong Zhang m = a->compressedrow.nrows; 163497952fefSHong Zhang ii = a->compressedrow.i; 163597952fefSHong Zhang ridx = a->compressedrow.rindex; 163697952fefSHong Zhang for (i = 0; i < m; i++) { 163797952fefSHong Zhang n = ii[i + 1] - ii[i]; 163897952fefSHong Zhang aj = a->j + ii[i]; 1639fff043a9SJunchao Zhang aa = a_a + ii[i]; 164097952fefSHong Zhang sum = y[*ridx]; 1641f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 164297952fefSHong Zhang z[*ridx++] = sum; 164397952fefSHong Zhang } 164497952fefSHong Zhang } else { /* do not use compressed row format */ 16453d3eaba7SBarry Smith ii = a->i; 1646f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16473d3eaba7SBarry Smith aj = a->j; 1648fff043a9SJunchao Zhang aa = a_a; 1649f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1650f15663dcSBarry Smith #else 165117ab2063SBarry Smith for (i = 0; i < m; i++) { 1652f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1653f15663dcSBarry Smith aj = a->j + ii[i]; 1654fff043a9SJunchao Zhang aa = a_a + ii[i]; 165517ab2063SBarry Smith sum = y[i]; 1656f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165717ab2063SBarry Smith z[i] = sum; 165817ab2063SBarry Smith } 165902ab625aSSatish Balay #endif 1660f15663dcSBarry Smith } 16619566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16629566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16639566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16653a40ed3dSBarry Smith PetscFunctionReturn(0); 166617ab2063SBarry Smith } 166717ab2063SBarry Smith 166817ab2063SBarry Smith /* 166917ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
167017ab2063SBarry Smith */ 1671d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1672d71ae5a4SJacob Faibussowitsch { 1673416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1674d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1675c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 167617ab2063SBarry Smith 16773a40ed3dSBarry Smith PetscFunctionBegin; 167809f38230SBarry Smith if (!a->diag) { 16799566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1680c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 168109f38230SBarry Smith } 1682d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1683c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1684c0c07093SJunchao Zhang if (alreadySet) { 1685c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1686c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1687c0c07093SJunchao Zhang } 1688c0c07093SJunchao Zhang 168909f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1690bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1691bfeeae90SHong Zhang if (a->j[j] == i) { 169209f38230SBarry Smith a->diag[i] = j; 169317ab2063SBarry Smith break; 169417ab2063SBarry Smith } 169517ab2063SBarry Smith } 169617ab2063SBarry Smith } 16973a40ed3dSBarry Smith PetscFunctionReturn(0); 169817ab2063SBarry Smith } 169917ab2063SBarry Smith 1700d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1701d71ae5a4SJacob Faibussowitsch { 170261ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 170361ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 170461ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 170561ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 170661ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 170761ecd0c6SBarry Smith 170861ecd0c6SBarry Smith PetscFunctionBegin; 
170961ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17119566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 171261ecd0c6SBarry Smith PetscFunctionReturn(0); 171361ecd0c6SBarry Smith } 171461ecd0c6SBarry Smith 171561ecd0c6SBarry Smith if (a->diagonaldense) { 171661ecd0c6SBarry Smith cnt = 0; 171761ecd0c6SBarry Smith } else { 17189566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 171961ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1720349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 172161ecd0c6SBarry Smith cnt++; 172261ecd0c6SBarry Smith mdiag[i] = 1; 172361ecd0c6SBarry Smith } 172461ecd0c6SBarry Smith } 172561ecd0c6SBarry Smith } 172661ecd0c6SBarry Smith if (!cnt) { 17279566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 172861ecd0c6SBarry Smith } else { 1729b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1730b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 173161ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 173261ecd0c6SBarry Smith 173361ecd0c6SBarry Smith a->a = NULL; 173461ecd0c6SBarry Smith a->j = NULL; 173561ecd0c6SBarry Smith a->i = NULL; 173661ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1737ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 173961ecd0c6SBarry Smith 174061ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 174161ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17429566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, 
a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 174348a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1744447d62f5SStefano Zampini } 17459566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17469566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 174761ecd0c6SBarry Smith if (singlemalloc) { 17489566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 174961ecd0c6SBarry Smith } else { 17509566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17519566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17529566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 175361ecd0c6SBarry Smith } 175461ecd0c6SBarry Smith } 17559566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 175661ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 175761ecd0c6SBarry Smith PetscFunctionReturn(0); 175861ecd0c6SBarry Smith } 175961ecd0c6SBarry Smith 1760be5855fcSBarry Smith /* 1761be5855fcSBarry Smith Checks for missing diagonals 1762be5855fcSBarry Smith */ 1763d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1764d71ae5a4SJacob Faibussowitsch { 1765be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17667734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1767be5855fcSBarry Smith 1768be5855fcSBarry Smith PetscFunctionBegin; 176909f38230SBarry Smith *missing = PETSC_FALSE; 17707734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 177109f38230SBarry Smith *missing = PETSC_TRUE; 177209f38230SBarry Smith if (d) *d = 0; 17739566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 177409f38230SBarry Smith } else { 177501445905SHong Zhang PetscInt n; 177601445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1777f1e2ffcdSBarry Smith diag = a->diag; 177801445905SHong Zhang for (i = 0; i < n; i++) { 17797734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 178009f38230SBarry Smith *missing = PETSC_TRUE; 178109f38230SBarry Smith if (d) *d = i; 17829566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1783358d2f5dSShri Abhyankar break; 178409f38230SBarry Smith } 1785be5855fcSBarry Smith } 1786be5855fcSBarry Smith } 1787be5855fcSBarry Smith PetscFunctionReturn(0); 1788be5855fcSBarry Smith } 1789be5855fcSBarry Smith 17900da83c2eSBarry Smith #include <petscblaslapack.h> 17910da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 17920da83c2eSBarry Smith 17930da83c2eSBarry Smith /* 17940da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 17950da83c2eSBarry Smith */ 1796d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1797d71ae5a4SJacob Faibussowitsch { 17980da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 17990da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18000da83c2eSBarry Smith const PetscReal shift = 0.0; 18010da83c2eSBarry Smith PetscInt ipvt[5]; 18020da83c2eSBarry Smith PetscScalar work[25], *v_work; 18030da83c2eSBarry Smith 18040da83c2eSBarry Smith PetscFunctionBegin; 18050da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 18060da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += 
bsizes[i]; 180708401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1808ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18099566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 181048a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18110da83c2eSBarry Smith ncnt = 0; 18120da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18130da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18149566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18150da83c2eSBarry Smith switch (bsizes[i]) { 1816d71ae5a4SJacob Faibussowitsch case 1: 1817d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1818d71ae5a4SJacob Faibussowitsch break; 18190da83c2eSBarry Smith case 2: 18209566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18210da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18229566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18230da83c2eSBarry Smith break; 18240da83c2eSBarry Smith case 3: 18259566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18260da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18279566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18280da83c2eSBarry Smith break; 18290da83c2eSBarry Smith case 4: 18309566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18310da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18329566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18330da83c2eSBarry Smith break; 18340da83c2eSBarry Smith case 5: 18359566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18360da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18379566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18380da83c2eSBarry Smith break; 18390da83c2eSBarry Smith case 6: 18409566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18410da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18429566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18430da83c2eSBarry Smith break; 18440da83c2eSBarry Smith case 7: 18459566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18460da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18480da83c2eSBarry Smith break; 18490da83c2eSBarry Smith default: 18509566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18510da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18529566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18530da83c2eSBarry Smith } 18540da83c2eSBarry Smith ncnt += bsizes[i]; 18550da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 18560da83c2eSBarry Smith } 185748a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18589566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18590da83c2eSBarry Smith PetscFunctionReturn(0); 18600da83c2eSBarry Smith } 18610da83c2eSBarry Smith 
1862422a814eSBarry Smith /* 1863422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1864422a814eSBarry Smith */ 1865d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1866d71ae5a4SJacob Faibussowitsch { 186771f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1868d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18692e5835c6SStefano Zampini const MatScalar *v; 187054f21887SBarry Smith PetscScalar *idiag, *mdiag; 187171f1c65dSBarry Smith 187271f1c65dSBarry Smith PetscFunctionBegin; 187371f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 18749566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 187571f1c65dSBarry Smith diag = a->diag; 18764dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18772e5835c6SStefano Zampini 187871f1c65dSBarry Smith mdiag = a->mdiag; 187971f1c65dSBarry Smith idiag = a->idiag; 18809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1881422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 188271f1c65dSBarry Smith for (i = 0; i < m; i++) { 188371f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1884899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1885899639b0SHong Zhang if (PetscRealPart(fshift)) { 18869566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 18877b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18887b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 18897b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 189098921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1891899639b0SHong Zhang } 189271f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 189371f1c65dSBarry Smith } 18949566063dSJacob 
Faibussowitsch PetscCall(PetscLogFlops(m)); 189571f1c65dSBarry Smith } else { 189671f1c65dSBarry Smith for (i = 0; i < m; i++) { 189771f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 189871f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 189971f1c65dSBarry Smith } 19009566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 190171f1c65dSBarry Smith } 190271f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 190471f1c65dSBarry Smith PetscFunctionReturn(0); 190571f1c65dSBarry Smith } 190671f1c65dSBarry Smith 1907c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 1908d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1909d71ae5a4SJacob Faibussowitsch { 1910416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1911e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19122e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 191354f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19143d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 191597f1f81fSBarry Smith const PetscInt *idx, *diag; 191617ab2063SBarry Smith 19173a40ed3dSBarry Smith PetscFunctionBegin; 1918b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19199566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 1920b215bc84SStefano Zampini PetscFunctionReturn(0); 1921b215bc84SStefano Zampini } 1922b965ef7fSBarry Smith its = its * lits; 192391723122SBarry Smith 192471f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19259566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 192671f1c65dSBarry Smith a->fshift = fshift; 192771f1c65dSBarry Smith 
a->omega = omega; 1928ed480e8bSBarry Smith 192971f1c65dSBarry Smith diag = a->diag; 193071f1c65dSBarry Smith t = a->ssor_work; 1931ed480e8bSBarry Smith idiag = a->idiag; 193271f1c65dSBarry Smith mdiag = a->mdiag; 1933ed480e8bSBarry Smith 19349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19359566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19369566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1937ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 193817ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 193917ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1940ed480e8bSBarry Smith bs = b; 194117ab2063SBarry Smith for (i = 0; i < m; i++) { 194271f1c65dSBarry Smith d = fshift + mdiag[i]; 1943416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1944ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19452e5835c6SStefano Zampini v = aa + diag[i] + 1; 194617ab2063SBarry Smith sum = b[i] * d / omega; 1947003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 194817ab2063SBarry Smith x[i] = sum; 194917ab2063SBarry Smith } 19509566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19519566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19539566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19543a40ed3dSBarry Smith PetscFunctionReturn(0); 195517ab2063SBarry Smith } 1956c783ea89SBarry Smith 195708401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1958f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19594c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1960887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 196117ab2063SBarry Smith 196217ab2063SBarry Smith (L + E)^{-1} A (U + 
E)^{-1} 196317ab2063SBarry Smith 1964887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 196517ab2063SBarry Smith */ 196617ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 196717ab2063SBarry Smith 196817ab2063SBarry Smith /* x = (E + U)^{-1} b */ 196917ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1970416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1971ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19722e5835c6SStefano Zampini v = aa + diag[i] + 1; 197317ab2063SBarry Smith sum = b[i]; 1974e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1975ed480e8bSBarry Smith x[i] = sum * idiag[i]; 197617ab2063SBarry Smith } 197717ab2063SBarry Smith 197817ab2063SBarry Smith /* t = b - (2*E - D)x */ 19792e5835c6SStefano Zampini v = aa; 19802205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 198117ab2063SBarry Smith 198217ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1983ed480e8bSBarry Smith ts = t; 1984416022c9SBarry Smith diag = a->diag; 198517ab2063SBarry Smith for (i = 0; i < m; i++) { 1986416022c9SBarry Smith n = diag[i] - a->i[i]; 1987ed480e8bSBarry Smith idx = a->j + a->i[i]; 19882e5835c6SStefano Zampini v = aa + a->i[i]; 198917ab2063SBarry Smith sum = t[i]; 1990003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 1991ed480e8bSBarry Smith t[i] = sum * idiag[i]; 1992733d66baSBarry Smith /* x = x + t */ 1993733d66baSBarry Smith x[i] += t[i]; 199417ab2063SBarry Smith } 199517ab2063SBarry Smith 19969566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 19979566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19989566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19993a40ed3dSBarry Smith PetscFunctionReturn(0); 200017ab2063SBarry Smith } 200117ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 200217ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 200317ab2063SBarry Smith for (i = 0; i < m; i++) 
{ 2004416022c9SBarry Smith n = diag[i] - a->i[i]; 2005ed480e8bSBarry Smith idx = a->j + a->i[i]; 20062e5835c6SStefano Zampini v = aa + a->i[i]; 200717ab2063SBarry Smith sum = b[i]; 2008e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20095c99c7daSBarry Smith t[i] = sum; 2010ed480e8bSBarry Smith x[i] = sum * idiag[i]; 201117ab2063SBarry Smith } 20125c99c7daSBarry Smith xb = t; 20139566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20143a40ed3dSBarry Smith } else xb = b; 201517ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 201617ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2017416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2018ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20192e5835c6SStefano Zampini v = aa + diag[i] + 1; 202017ab2063SBarry Smith sum = xb[i]; 2021e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20225c99c7daSBarry Smith if (xb == b) { 2023ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20245c99c7daSBarry Smith } else { 2025b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 202617ab2063SBarry Smith } 20275c99c7daSBarry Smith } 20289566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 202917ab2063SBarry Smith } 203017ab2063SBarry Smith its--; 203117ab2063SBarry Smith } 203217ab2063SBarry Smith while (its--) { 203317ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 203417ab2063SBarry Smith for (i = 0; i < m; i++) { 2035b19a5dc2SMark Adams /* lower */ 2036b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2037ed480e8bSBarry Smith idx = a->j + a->i[i]; 20382e5835c6SStefano Zampini v = aa + a->i[i]; 203917ab2063SBarry Smith sum = b[i]; 2040e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2041b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2042b19a5dc2SMark Adams /* upper */ 2043b19a5dc2SMark Adams n = a->i[i + 1] - 
diag[i] - 1; 2044b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20452e5835c6SStefano Zampini v = aa + diag[i] + 1; 2046b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2047b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 204817ab2063SBarry Smith } 2049b19a5dc2SMark Adams xb = t; 20509566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2051b19a5dc2SMark Adams } else xb = b; 205217ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 205317ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2054b19a5dc2SMark Adams sum = xb[i]; 2055b19a5dc2SMark Adams if (xb == b) { 2056b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2057416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2058ed480e8bSBarry Smith idx = a->j + a->i[i]; 20592e5835c6SStefano Zampini v = aa + a->i[i]; 2060e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2061ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2062b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2063b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2064b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20652e5835c6SStefano Zampini v = aa + diag[i] + 1; 2066b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2067b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 206817ab2063SBarry Smith } 2069b19a5dc2SMark Adams } 2070b19a5dc2SMark Adams if (xb == b) { 20719566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2072b19a5dc2SMark Adams } else { 20739566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2074b19a5dc2SMark Adams } 207517ab2063SBarry Smith } 207617ab2063SBarry Smith } 20779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20789566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 2080365a8a9eSBarry Smith PetscFunctionReturn(0); 208117ab2063SBarry Smith } 208217ab2063SBarry Smith 2083d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2084d71ae5a4SJacob Faibussowitsch { 2085416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 20864e220ebcSLois Curfman McInnes 20873a40ed3dSBarry Smith PetscFunctionBegin; 20884e220ebcSLois Curfman McInnes info->block_size = 1.0; 20893966268fSBarry Smith info->nz_allocated = a->maxnz; 20903966268fSBarry Smith info->nz_used = a->nz; 20913966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 20923966268fSBarry Smith info->assemblies = A->num_ass; 20933966268fSBarry Smith info->mallocs = A->info.mallocs; 20944dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2095d5f3da31SBarry Smith if (A->factortype) { 20964e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 20974e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 20984e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 20994e220ebcSLois Curfman McInnes } else { 21004e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21014e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21024e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 21034e220ebcSLois Curfman 
McInnes } 21043a40ed3dSBarry Smith PetscFunctionReturn(0); 210517ab2063SBarry Smith } 210617ab2063SBarry Smith 2107d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2108d71ae5a4SJacob Faibussowitsch { 2109416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2110c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 211197b48c8fSBarry Smith const PetscScalar *xx; 21122e5835c6SStefano Zampini PetscScalar *bb, *aa; 2113c7da8527SEric Chamberland PetscInt d = 0; 211417ab2063SBarry Smith 21153a40ed3dSBarry Smith PetscFunctionBegin; 211697b48c8fSBarry Smith if (x && b) { 21179566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21189566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 211997b48c8fSBarry Smith for (i = 0; i < N; i++) { 2120aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2121447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 212297b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 212397b48c8fSBarry Smith } 21249566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21259566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 212697b48c8fSBarry Smith } 212797b48c8fSBarry Smith 21289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2129a9817697SBarry Smith if (a->keepnonzeropattern) { 2130f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2131aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21329566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2133f1e2ffcdSBarry Smith } 2134f4df32b1SMatthew Knepley if (diag != 0.0) { 2135c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2136c7da8527SEric Chamberland d = rows[i]; 2137447d62f5SStefano Zampini if 
(rows[i] >= A->cmap->n) continue; 213808401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2139c7da8527SEric Chamberland } 2140f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2141447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21422e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2143f1e2ffcdSBarry Smith } 2144f1e2ffcdSBarry Smith } 2145f1e2ffcdSBarry Smith } else { 2146f4df32b1SMatthew Knepley if (diag != 0.0) { 214717ab2063SBarry Smith for (i = 0; i < N; i++) { 2148aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21497ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2150447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2151447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2152447d62f5SStefano Zampini } else { 2153416022c9SBarry Smith a->ilen[rows[i]] = 1; 21542e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2155bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2156447d62f5SStefano Zampini } 2157447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21589566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 215917ab2063SBarry Smith } 216017ab2063SBarry Smith } 21613a40ed3dSBarry Smith } else { 216217ab2063SBarry Smith for (i = 0; i < N; i++) { 2163aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2164416022c9SBarry Smith a->ilen[rows[i]] = 0; 216517ab2063SBarry Smith } 216617ab2063SBarry Smith } 2167e56f5c9eSBarry Smith A->nonzerostate++; 2168f1e2ffcdSBarry Smith } 21699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2170dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 
21713a40ed3dSBarry Smith PetscFunctionReturn(0); 217217ab2063SBarry Smith } 217317ab2063SBarry Smith 2174d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2175d71ae5a4SJacob Faibussowitsch { 21766e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21776e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21782b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21796e169961SBarry Smith const PetscScalar *xx; 21802e5835c6SStefano Zampini PetscScalar *bb, *aa; 21816e169961SBarry Smith 21826e169961SBarry Smith PetscFunctionBegin; 21832e5835c6SStefano Zampini if (!N) PetscFunctionReturn(0); 21849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 21856e169961SBarry Smith if (x && b) { 21869566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21879566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 21882b40b63fSBarry Smith vecs = PETSC_TRUE; 21896e169961SBarry Smith } 21909566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 21916e169961SBarry Smith for (i = 0; i < N; i++) { 2192aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21939566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 21942205254eSKarl Rupp 21956e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 21966e169961SBarry Smith } 21976e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 21986e169961SBarry Smith if (!zeroed[i]) { 21996e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22004cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22012e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22022e5835c6SStefano Zampini aa[j] = 0.0; 22036e169961SBarry Smith } 22046e169961SBarry Smith } 22054cf107fdSStefano Zampini } else if (vecs && i < 
A->cmap->N) bb[i] = diag * xx[i]; 22066e169961SBarry Smith } 22076e169961SBarry Smith if (x && b) { 22089566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22099566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22106e169961SBarry Smith } 22119566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22126e169961SBarry Smith if (diag != 0.0) { 22139566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22141d5a398dSstefano_zampini if (missing) { 22151d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22164cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2217aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22189566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22191d5a398dSstefano_zampini } 22201d5a398dSstefano_zampini } else { 2221ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22226e169961SBarry Smith } 22231d5a398dSstefano_zampini } 22249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2225dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22266e169961SBarry Smith PetscFunctionReturn(0); 22276e169961SBarry Smith } 22286e169961SBarry Smith 2229d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2230d71ae5a4SJacob Faibussowitsch { 2231fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2232fff043a9SJunchao Zhang const PetscScalar *aa; 2233fff043a9SJunchao Zhang PetscInt *itmp; 223417ab2063SBarry Smith 22353a40ed3dSBarry Smith PetscFunctionBegin; 22369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2237416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22382e5835c6SStefano Zampini if (v) *v = 
(PetscScalar *)(aa + a->i[row]); 223917ab2063SBarry Smith if (idx) { 2240bfeeae90SHong Zhang itmp = a->j + a->i[row]; 224126fbe8dcSKarl Rupp if (*nz) *idx = itmp; 2242f4259b30SLisandro Dalcin else *idx = NULL; 224317ab2063SBarry Smith } 22449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22453a40ed3dSBarry Smith PetscFunctionReturn(0); 224617ab2063SBarry Smith } 224717ab2063SBarry Smith 2248d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2249d71ae5a4SJacob Faibussowitsch { 22503a40ed3dSBarry Smith PetscFunctionBegin; 2251cb4a9cd9SHong Zhang if (nz) *nz = 0; 22522e5835c6SStefano Zampini if (idx) *idx = NULL; 22532e5835c6SStefano Zampini if (v) *v = NULL; 22543a40ed3dSBarry Smith PetscFunctionReturn(0); 225517ab2063SBarry Smith } 225617ab2063SBarry Smith 2257d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2258d71ae5a4SJacob Faibussowitsch { 2259416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22602e5835c6SStefano Zampini const MatScalar *v; 226136db0b34SBarry Smith PetscReal sum = 0.0; 226297f1f81fSBarry Smith PetscInt i, j; 226317ab2063SBarry Smith 22643a40ed3dSBarry Smith PetscFunctionBegin; 22659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 226617ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2267570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2268570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2269792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2270570b7f6dSBarry Smith #else 2271416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22729371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22739371c9d4SSatish Balay v++; 227417ab2063SBarry Smith } 22758f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2276570b7f6dSBarry Smith #endif 22779566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22783a40ed3dSBarry Smith } else if (type == NORM_1) { 227936db0b34SBarry Smith PetscReal *tmp; 228097f1f81fSBarry Smith PetscInt *jj = a->j; 22819566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2282064f8208SBarry Smith *nrm = 0.0; 2283416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22849371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22859371c9d4SSatish Balay v++; 228617ab2063SBarry Smith } 2287d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2288064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 228917ab2063SBarry Smith } 22909566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 22919566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 22923a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2293064f8208SBarry Smith *nrm = 0.0; 2294d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 22952e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 229617ab2063SBarry Smith sum = 0.0; 2297416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 22989371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 22999371c9d4SSatish Balay v2++; 230017ab2063SBarry Smith } 2301064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 230217ab2063SBarry Smith } 23039566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2304f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23063a40ed3dSBarry Smith PetscFunctionReturn(0); 230717ab2063SBarry Smith } 230817ab2063SBarry Smith 2309d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2310d71ae5a4SJacob Faibussowitsch { 23113d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 231254f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 23132e5835c6SStefano Zampini const MatScalar *va, *vb; 
231497f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2315cd0d46ebSvictorle 2316cd0d46ebSvictorle PetscFunctionBegin; 23179566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23189566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23195485867bSBarry Smith if (ma != nb || na != mb) { 23205485867bSBarry Smith *f = PETSC_FALSE; 23215485867bSBarry Smith PetscFunctionReturn(0); 23225485867bSBarry Smith } 23239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23259371c9d4SSatish Balay aii = aij->i; 23269371c9d4SSatish Balay bii = bij->i; 23279371c9d4SSatish Balay adx = aij->j; 23289371c9d4SSatish Balay bdx = bij->j; 23299566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23309566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2331cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2332cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2333cd0d46ebSvictorle 2334cd0d46ebSvictorle *f = PETSC_TRUE; 2335cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2336cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 233797f1f81fSBarry Smith PetscInt idc, idr; 23385485867bSBarry Smith PetscScalar vc, vr; 2339cd0d46ebSvictorle /* column/row index/value */ 23405485867bSBarry Smith idc = adx[aptr[i]]; 23415485867bSBarry Smith idr = bdx[bptr[idc]]; 23425485867bSBarry Smith vc = va[aptr[i]]; 23435485867bSBarry Smith vr = vb[bptr[idc]]; 23445485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23455485867bSBarry Smith *f = PETSC_FALSE; 23465485867bSBarry Smith goto done; 2347cd0d46ebSvictorle } else { 23485485867bSBarry Smith aptr[i]++; 23495485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2350cd0d46ebSvictorle } 2351cd0d46ebSvictorle } 2352cd0d46ebSvictorle } 2353cd0d46ebSvictorle done: 23549566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23559566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 
23569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 2358cd0d46ebSvictorle PetscFunctionReturn(0); 2359cd0d46ebSvictorle } 2360cd0d46ebSvictorle 2361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2362d71ae5a4SJacob Faibussowitsch { 23633d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 236454f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 236554f21887SBarry Smith MatScalar *va, *vb; 23661cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23671cbb95d3SBarry Smith 23681cbb95d3SBarry Smith PetscFunctionBegin; 23699566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23709566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23711cbb95d3SBarry Smith if (ma != nb || na != mb) { 23721cbb95d3SBarry Smith *f = PETSC_FALSE; 23731cbb95d3SBarry Smith PetscFunctionReturn(0); 23741cbb95d3SBarry Smith } 23759371c9d4SSatish Balay aii = aij->i; 23769371c9d4SSatish Balay bii = bij->i; 23779371c9d4SSatish Balay adx = aij->j; 23789371c9d4SSatish Balay bdx = bij->j; 23799371c9d4SSatish Balay va = aij->a; 23809371c9d4SSatish Balay vb = bij->a; 23819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23831cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23841cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23851cbb95d3SBarry Smith 23861cbb95d3SBarry Smith *f = PETSC_TRUE; 23871cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 23881cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 23891cbb95d3SBarry Smith PetscInt idc, idr; 23901cbb95d3SBarry Smith PetscScalar vc, vr; 23911cbb95d3SBarry Smith /* column/row index/value */ 23921cbb95d3SBarry Smith idc = adx[aptr[i]]; 23931cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 
23941cbb95d3SBarry Smith vc = va[aptr[i]]; 23951cbb95d3SBarry Smith vr = vb[bptr[idc]]; 23961cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 23971cbb95d3SBarry Smith *f = PETSC_FALSE; 23981cbb95d3SBarry Smith goto done; 23991cbb95d3SBarry Smith } else { 24001cbb95d3SBarry Smith aptr[i]++; 24011cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24021cbb95d3SBarry Smith } 24031cbb95d3SBarry Smith } 24041cbb95d3SBarry Smith } 24051cbb95d3SBarry Smith done: 24069566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24079566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24081cbb95d3SBarry Smith PetscFunctionReturn(0); 24091cbb95d3SBarry Smith } 24101cbb95d3SBarry Smith 2411d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2412d71ae5a4SJacob Faibussowitsch { 24139e29f15eSvictorle PetscFunctionBegin; 24149566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f)); 24159e29f15eSvictorle PetscFunctionReturn(0); 24169e29f15eSvictorle } 24179e29f15eSvictorle 2418d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2419d71ae5a4SJacob Faibussowitsch { 24201cbb95d3SBarry Smith PetscFunctionBegin; 24219566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f)); 24221cbb95d3SBarry Smith PetscFunctionReturn(0); 24231cbb95d3SBarry Smith } 24241cbb95d3SBarry Smith 2425d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2426d71ae5a4SJacob Faibussowitsch { 2427416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2428fff8e43fSBarry Smith const PetscScalar *l, *r; 2429fff8e43fSBarry Smith PetscScalar x; 243054f21887SBarry Smith MatScalar *v; 2431fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2432fff8e43fSBarry Smith const PetscInt *jj; 243317ab2063SBarry Smith 24343a40ed3dSBarry Smith PetscFunctionBegin; 
243517ab2063SBarry Smith if (ll) { 24363ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24373ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24389566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 243908401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24409566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 244217ab2063SBarry Smith for (i = 0; i < m; i++) { 244317ab2063SBarry Smith x = l[i]; 2444416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24452205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 244617ab2063SBarry Smith } 24479566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24489566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 245017ab2063SBarry Smith } 245117ab2063SBarry Smith if (rr) { 24529566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 245308401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24549566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24562e5835c6SStefano Zampini jj = a->j; 24572205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24599566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24609566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 246117ab2063SBarry Smith } 24629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24633a40ed3dSBarry Smith PetscFunctionReturn(0); 246417ab2063SBarry Smith } 246517ab2063SBarry Smith 2466d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, 
PetscInt csize, MatReuse scall, Mat *B) 2467d71ae5a4SJacob Faibussowitsch { 2468db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2469d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 247097f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24715d0c19d7SBarry Smith const PetscInt *irow, *icol; 24722e5835c6SStefano Zampini const PetscScalar *aa; 24735d0c19d7SBarry Smith PetscInt nrows, ncols; 247497f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 247554f21887SBarry Smith MatScalar *a_new, *mat_a; 2476416022c9SBarry Smith Mat C; 2477cdc6f3adSToby Isaac PetscBool stride; 247817ab2063SBarry Smith 24793a40ed3dSBarry Smith PetscFunctionBegin; 24809566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24819566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24829566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 248317ab2063SBarry Smith 24849566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2485ff718158SBarry Smith if (stride) { 24869566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2487ff718158SBarry Smith } else { 2488ff718158SBarry Smith first = 0; 2489ff718158SBarry Smith step = 0; 2490ff718158SBarry Smith } 2491fee21e36SBarry Smith if (stride && step == 1) { 249202834360SBarry Smith /* special case of contiguous rows */ 24939566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 249402834360SBarry Smith /* loop over new rows determining lens and starting points */ 249502834360SBarry Smith for (i = 0; i < nrows; i++) { 2496bfeeae90SHong Zhang kstart = ai[irow[i]]; 2497a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2498a91a9bebSLisandro Dalcin starts[i] = kstart; 249902834360SBarry Smith for (k = kstart; k < kend; k++) { 2500bfeeae90SHong Zhang if (aj[k] >= 
first) { 250102834360SBarry Smith starts[i] = k; 250202834360SBarry Smith break; 250302834360SBarry Smith } 250402834360SBarry Smith } 2505a2744918SBarry Smith sum = 0; 250602834360SBarry Smith while (k < kend) { 2507bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2508a2744918SBarry Smith sum++; 250902834360SBarry Smith } 2510a2744918SBarry Smith lens[i] = sum; 251102834360SBarry Smith } 251202834360SBarry Smith /* create submatrix */ 2513cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 251497f1f81fSBarry Smith PetscInt n_cols, n_rows; 25159566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2516aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25179566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 251808480c60SBarry Smith C = *B; 25193a40ed3dSBarry Smith } else { 25203bef6203SJed Brown PetscInt rbs, cbs; 25219566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25229566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25239566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25249566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25259566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25269566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 252808480c60SBarry Smith } 2529db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2530db02288aSLois Curfman McInnes 253102834360SBarry Smith /* loop over rows inserting into submatrix */ 2532db02288aSLois Curfman McInnes a_new = c->a; 2533db02288aSLois Curfman McInnes j_new = c->j; 2534db02288aSLois Curfman McInnes i_new = c->i; 25359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 253602834360SBarry Smith for (i 
= 0; i < nrows; i++) { 2537a2744918SBarry Smith ii = starts[i]; 2538a2744918SBarry Smith lensi = lens[i]; 2539ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25409566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2541a2744918SBarry Smith a_new += lensi; 2542a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2543a2744918SBarry Smith c->ilen[i] = lensi; 254402834360SBarry Smith } 25459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25469566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25473a40ed3dSBarry Smith } else { 25489566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25499566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25514dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25526bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25534dcab191SBarry Smith smap[icol[i]] = i + 1; 25544dcab191SBarry Smith } 25554dcab191SBarry Smith 255602834360SBarry Smith /* determine lens of each row */ 255702834360SBarry Smith for (i = 0; i < nrows; i++) { 2558bfeeae90SHong Zhang kstart = ai[irow[i]]; 255902834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 256002834360SBarry Smith lens[i] = 0; 256102834360SBarry Smith for (k = kstart; k < kend; k++) { 2562ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 256302834360SBarry Smith } 256402834360SBarry Smith } 256517ab2063SBarry Smith /* Create and fill new matrix */ 2566a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2567ace3abfcSBarry Smith PetscBool equal; 25680f5bd95cSBarry Smith 256999141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2570aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == 
ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25719566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 257228b400f6SJacob Faibussowitsch PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong no of nonzeros"); 25739566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 257408480c60SBarry Smith C = *B; 25753a40ed3dSBarry Smith } else { 25763bef6203SJed Brown PetscInt rbs, cbs; 25779566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25789566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25799566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25809566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25819566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25829566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 258408480c60SBarry Smith } 25859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 258699141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 258717ab2063SBarry Smith for (i = 0; i < nrows; i++) { 258899141d43SSatish Balay row = irow[i]; 2589bfeeae90SHong Zhang kstart = ai[row]; 259099141d43SSatish Balay kend = kstart + a->ilen[row]; 2591bfeeae90SHong Zhang mat_i = c->i[i]; 259299141d43SSatish Balay mat_j = c->j + mat_i; 259399141d43SSatish Balay mat_a = c->a + mat_i; 259499141d43SSatish Balay mat_ilen = c->ilen + i; 259517ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2596bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2597ed480e8bSBarry Smith *mat_j++ = tcol - 1; 25982e5835c6SStefano Zampini *mat_a++ = aa[k]; 259999141d43SSatish Balay (*mat_ilen)++; 260017ab2063SBarry Smith } 260117ab2063SBarry Smith } 260217ab2063SBarry Smith } 26039566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 260402834360SBarry Smith /* Free work space */ 26059566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26069566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26079566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2608cdc6f3adSToby Isaac /* sort */ 2609cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2610cdc6f3adSToby Isaac PetscInt ilen; 2611cdc6f3adSToby Isaac 2612cdc6f3adSToby Isaac mat_i = c->i[i]; 2613cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2614cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2615cdc6f3adSToby Isaac ilen = c->ilen[i]; 26169566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2617cdc6f3adSToby Isaac } 261802834360SBarry Smith } 26198c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26209566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2621305c6ccfSStefano Zampini #endif 26229566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26239566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 262417ab2063SBarry Smith 26259566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2626416022c9SBarry Smith *B = C; 26273a40ed3dSBarry Smith PetscFunctionReturn(0); 262817ab2063SBarry Smith } 262917ab2063SBarry Smith 2630d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2631d71ae5a4SJacob Faibussowitsch { 263282d44351SHong Zhang Mat B; 263382d44351SHong Zhang 263482d44351SHong Zhang PetscFunctionBegin; 2635c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26369566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26379566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26389566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26399566063dSJacob Faibussowitsch 
PetscCall(MatSetType(B, MATSEQAIJ)); 26409566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 264182d44351SHong Zhang *subMat = B; 2642c2d650bdSHong Zhang } else { 26439566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2644c2d650bdSHong Zhang } 264582d44351SHong Zhang PetscFunctionReturn(0); 264682d44351SHong Zhang } 264782d44351SHong Zhang 2648d71ae5a4SJacob Faibussowitsch PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2649d71ae5a4SJacob Faibussowitsch { 265063b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 265163b91edcSBarry Smith Mat outA; 2652ace3abfcSBarry Smith PetscBool row_identity, col_identity; 265363b91edcSBarry Smith 26543a40ed3dSBarry Smith PetscFunctionBegin; 265508401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26561df811f5SHong Zhang 26579566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26589566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2659a871dcd8SBarry Smith 266063b91edcSBarry Smith outA = inA; 2661d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26629566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26639566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26642205254eSKarl Rupp 26659566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26669566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26672205254eSKarl Rupp 2668c3122656SLisandro Dalcin a->row = row; 26692205254eSKarl Rupp 26709566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26719566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26722205254eSKarl Rupp 2673c3122656SLisandro Dalcin a->col = col; 267463b91edcSBarry Smith 267536db0b34SBarry Smith /* Create the inverse permutation so 
that it can be used in MatLUFactorNumeric() */ 26769566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26779566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2678f0ec6fceSSatish Balay 267994a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 268194a9d846SBarry Smith } 268263b91edcSBarry Smith 26839566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2684137fb511SHong Zhang if (row_identity && col_identity) { 26859566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2686137fb511SHong Zhang } else { 26879566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2688137fb511SHong Zhang } 26893a40ed3dSBarry Smith PetscFunctionReturn(0); 2690a871dcd8SBarry Smith } 2691a871dcd8SBarry Smith 2692d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2693d71ae5a4SJacob Faibussowitsch { 2694f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2695dfa0f9e5SStefano Zampini PetscScalar *v; 2696c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 26973a40ed3dSBarry Smith 26983a40ed3dSBarry Smith PetscFunctionBegin; 26999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27009566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2701792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27029566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27053a40ed3dSBarry Smith PetscFunctionReturn(0); 2706f0b747eeSBarry Smith } 2707f0b747eeSBarry Smith 2708d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 
2709d71ae5a4SJacob Faibussowitsch { 271016b64355SHong Zhang PetscInt i; 271116b64355SHong Zhang 271216b64355SHong Zhang PetscFunctionBegin; 271316b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27149566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 271516b64355SHong Zhang 271648a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27179566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 271816b64355SHong Zhang 271916b64355SHong Zhang if (submatj->rbuf1) { 27209566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27219566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 272216b64355SHong Zhang } 272316b64355SHong Zhang 272448a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27259566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27269566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 272716b64355SHong Zhang } 272816b64355SHong Zhang 272916b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 27309566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable *)&submatj->rmap)); 27319566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27329566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 273316b64355SHong Zhang #else 27349566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 273516b64355SHong Zhang #endif 273616b64355SHong Zhang 273716b64355SHong Zhang if (!submatj->allcolumns) { 273816b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 27399566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable *)&submatj->cmap)); 274016b64355SHong Zhang #else 27419566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 274216b64355SHong 
Zhang #endif 274316b64355SHong Zhang } 27449566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 274516b64355SHong Zhang 27469566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 274716b64355SHong Zhang PetscFunctionReturn(0); 274816b64355SHong Zhang } 274916b64355SHong Zhang 2750d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2751d71ae5a4SJacob Faibussowitsch { 275216b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27535c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 275416b64355SHong Zhang 275516b64355SHong Zhang PetscFunctionBegin; 27569566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27579566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 275816b64355SHong Zhang PetscFunctionReturn(0); 275916b64355SHong Zhang } 276016b64355SHong Zhang 276189a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2762d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2763d71ae5a4SJacob Faibussowitsch { 27642d033e1fSHong Zhang PetscInt i; 27650fb991dcSHong Zhang Mat C; 27660fb991dcSHong Zhang Mat_SeqAIJ *c; 27670fb991dcSHong Zhang Mat_SubSppt *submatj; 27682d033e1fSHong Zhang 27692d033e1fSHong Zhang PetscFunctionBegin; 27702d033e1fSHong Zhang for (i = 0; i < n; i++) { 27710fb991dcSHong Zhang C = (*mat)[i]; 27720fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27730fb991dcSHong Zhang submatj = c->submatis1; 27742d033e1fSHong Zhang if (submatj) { 2775682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 277626cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27779566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27789566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27799566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27803faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27819566063dSJacob 
Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27829566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27839566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2784682e4c99SStefano Zampini } 27852d033e1fSHong Zhang } else { 27869566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27872d033e1fSHong Zhang } 27882d033e1fSHong Zhang } 278986e85357SHong Zhang 279063a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27919566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 279263a75b2aSHong Zhang 27939566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 27942d033e1fSHong Zhang PetscFunctionReturn(0); 27952d033e1fSHong Zhang } 27962d033e1fSHong Zhang 2797d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2798d71ae5a4SJacob Faibussowitsch { 279997f1f81fSBarry Smith PetscInt i; 2800cddf8d76SBarry Smith 28013a40ed3dSBarry Smith PetscFunctionBegin; 280248a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2803cddf8d76SBarry Smith 280448a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28053a40ed3dSBarry Smith PetscFunctionReturn(0); 2806cddf8d76SBarry Smith } 2807cddf8d76SBarry Smith 2808d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2809d71ae5a4SJacob Faibussowitsch { 2810e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28115d0c19d7SBarry Smith PetscInt row, i, j, k, l, m, n, *nidx, isz, val; 28125d0c19d7SBarry Smith const PetscInt *idx; 281397f1f81fSBarry Smith PetscInt start, end, *ai, *aj; 2814f1af5d2fSBarry Smith PetscBT table; 2815bbd702dbSSatish Balay 28163a40ed3dSBarry Smith PetscFunctionBegin; 2817d0f46423SBarry Smith m = A->rmap->n; 2818e4d965acSSatish Balay ai = a->i; 
2819bfeeae90SHong Zhang aj = a->j; 28208a047759SSatish Balay 282108401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 282206763907SSatish Balay 28239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28249566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 282506763907SSatish Balay 2826e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2827b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2828e4d965acSSatish Balay isz = 0; 28299566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2830e4d965acSSatish Balay 2831e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28329566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28339566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2834e4d965acSSatish Balay 2835dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 2836e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28372205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28384dcbc457SBarry Smith } 28399566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28409566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2841e4d965acSSatish Balay 284204a348a9SBarry Smith k = 0; 284304a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 284404a348a9SBarry Smith n = isz; 284506763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2846e4d965acSSatish Balay row = nidx[k]; 2847e4d965acSSatish Balay start = ai[row]; 2848e4d965acSSatish Balay end = ai[row + 1]; 284904a348a9SBarry Smith for (l = start; l < end; l++) { 2850efb16452SHong Zhang val = aj[l]; 28512205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2852e4d965acSSatish Balay } 2853e4d965acSSatish Balay } 2854e4d965acSSatish Balay } 
28559566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2856e4d965acSSatish Balay } 28579566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28589566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28593a40ed3dSBarry Smith PetscFunctionReturn(0); 28604dcbc457SBarry Smith } 286117ab2063SBarry Smith 28620513a670SBarry Smith /* -------------------------------------------------------------- */ 2863d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2864d71ae5a4SJacob Faibussowitsch { 28650513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28663b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 28675d0c19d7SBarry Smith const PetscInt *row, *col; 28685d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 286956cd22aeSBarry Smith IS icolp, irowp; 28700298fd71SBarry Smith PetscInt *cwork = NULL; 28710298fd71SBarry Smith PetscScalar *vwork = NULL; 28720513a670SBarry Smith 28733a40ed3dSBarry Smith PetscFunctionBegin; 28749566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 28759566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 28769566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 28779566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 28780513a670SBarry Smith 28790513a670SBarry Smith /* determine lengths of permuted rows */ 28809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 28812205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 28829566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 28839566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 28849566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 28859566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 
28869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 28879566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 28880513a670SBarry Smith 28899566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 28900513a670SBarry Smith for (i = 0; i < m; i++) { 28919566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 28922205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 28939566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 28949566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 28950513a670SBarry Smith } 28969566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 28972205254eSKarl Rupp 28983c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 28992205254eSKarl Rupp 29008c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29019566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29029fe5e383SStefano Zampini #endif 29039566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29049566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29059566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29069566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29079566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29089566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 290948a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29103a40ed3dSBarry Smith PetscFunctionReturn(0); 29110513a670SBarry Smith } 29120513a670SBarry Smith 2913d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2914d71ae5a4SJacob Faibussowitsch { 2915cb5b572fSBarry Smith PetscFunctionBegin; 291633f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. 
*/ 291733f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2918be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2919be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29202e5835c6SStefano Zampini const PetscScalar *aa; 2921be6bf707SBarry Smith 29229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 292308401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29249566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29259566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2927cb5b572fSBarry Smith } else { 29289566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2929cb5b572fSBarry Smith } 2930cb5b572fSBarry Smith PetscFunctionReturn(0); 2931cb5b572fSBarry Smith } 2932cb5b572fSBarry Smith 2933d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetUp_SeqAIJ(Mat A) 2934d71ae5a4SJacob Faibussowitsch { 2935273d9f13SBarry Smith PetscFunctionBegin; 29369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, PETSC_DEFAULT, NULL)); 2937273d9f13SBarry Smith PetscFunctionReturn(0); 2938273d9f13SBarry Smith } 2939273d9f13SBarry Smith 2940d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2941d71ae5a4SJacob Faibussowitsch { 29426c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29436e111a19SKarl Rupp 29446c0721eeSBarry Smith PetscFunctionBegin; 29456c0721eeSBarry Smith *array = a->a; 29466c0721eeSBarry Smith PetscFunctionReturn(0); 29476c0721eeSBarry Smith } 29486c0721eeSBarry Smith 2949d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, 
PetscScalar *array[]) 2950d71ae5a4SJacob Faibussowitsch { 29516c0721eeSBarry Smith PetscFunctionBegin; 2952f38c1e66SStefano Zampini *array = NULL; 29536c0721eeSBarry Smith PetscFunctionReturn(0); 29546c0721eeSBarry Smith } 2955273d9f13SBarry Smith 29568229c054SShri Abhyankar /* 29578229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29588229c054SShri Abhyankar have different nonzero structure. 29598229c054SShri Abhyankar */ 2960d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2961d71ae5a4SJacob Faibussowitsch { 2962b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2963ec7775f6SShri Abhyankar 2964ec7775f6SShri Abhyankar PetscFunctionBegin; 2965ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2966ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 2967b264fe52SHong Zhang const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i]; 2968b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 2969b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 29708af7cee1SJed Brown nnz[i] = 0; 29718af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 2972b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2973b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 29748af7cee1SJed Brown nnz[i]++; 29758af7cee1SJed Brown } 29768af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 2977ec7775f6SShri Abhyankar } 2978ec7775f6SShri Abhyankar PetscFunctionReturn(0); 2979ec7775f6SShri Abhyankar } 2980ec7775f6SShri Abhyankar 2981d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 2982d71ae5a4SJacob Faibussowitsch { 2983b264fe52SHong Zhang PetscInt m = Y->rmap->N; 2984b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 2985b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ 
*)Y->data; 2986b264fe52SHong Zhang 2987b264fe52SHong Zhang PetscFunctionBegin; 2988b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 29899566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 2990b264fe52SHong Zhang PetscFunctionReturn(0); 2991b264fe52SHong Zhang } 2992b264fe52SHong Zhang 2993d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 2994d71ae5a4SJacob Faibussowitsch { 2995ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 2996ac90fabeSBarry Smith 2997ac90fabeSBarry Smith PetscFunctionBegin; 2998134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 2999134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3000134adf20SPierre Jolivet if (e) { 30019566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 300281fa06acSBarry Smith if (e) { 30039566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3004134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 300581fa06acSBarry Smith } 300681fa06acSBarry Smith } 300754c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 300881fa06acSBarry Smith } 3009ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30102e5835c6SStefano Zampini const PetscScalar *xa; 30112e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 301281fa06acSBarry Smith PetscBLASInt one = 1, bnz; 301381fa06acSBarry Smith 30149566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3017792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, 
ya, &one)); 30189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30209566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30229566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3023ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30249566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3025ac90fabeSBarry Smith } else { 30268229c054SShri Abhyankar Mat B; 30278229c054SShri Abhyankar PetscInt *nnz; 30289566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30299566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30309566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30319566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30329566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30339566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30359566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30369566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30379bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30389566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3039ac90fabeSBarry Smith } 3040ac90fabeSBarry Smith PetscFunctionReturn(0); 3041ac90fabeSBarry Smith } 3042ac90fabeSBarry Smith 3043d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3044d71ae5a4SJacob Faibussowitsch { 3045354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3046354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3047354c94deSBarry Smith 
PetscInt i, nz; 3048354c94deSBarry Smith PetscScalar *a; 3049354c94deSBarry Smith 3050354c94deSBarry Smith PetscFunctionBegin; 3051354c94deSBarry Smith nz = aij->nz; 30529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30532205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 30549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3055354c94deSBarry Smith #else 3056354c94deSBarry Smith PetscFunctionBegin; 3057354c94deSBarry Smith #endif 3058354c94deSBarry Smith PetscFunctionReturn(0); 3059354c94deSBarry Smith } 3060354c94deSBarry Smith 3061d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3062d71ae5a4SJacob Faibussowitsch { 3063e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3064d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3065e34fafa9SBarry Smith PetscReal atmp; 3066985db425SBarry Smith PetscScalar *x; 3067ce496241SStefano Zampini const MatScalar *aa, *av; 3068e34fafa9SBarry Smith 3069e34fafa9SBarry Smith PetscFunctionBegin; 307028b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 30719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3072ce496241SStefano Zampini aa = av; 3073e34fafa9SBarry Smith ai = a->i; 3074e34fafa9SBarry Smith aj = a->j; 3075e34fafa9SBarry Smith 30769566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 30779566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 30789566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 307908401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3080e34fafa9SBarry Smith for (i = 0; i < m; i++) { 30819371c9d4SSatish Balay ncols = ai[1] - ai[0]; 30829371c9d4SSatish Balay ai++; 3083e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3084985db425SBarry Smith atmp = PetscAbsScalar(*aa); 
30859371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 30869371c9d4SSatish Balay x[i] = atmp; 30879371c9d4SSatish Balay if (idx) idx[i] = *aj; 30889371c9d4SSatish Balay } 30899371c9d4SSatish Balay aa++; 30909371c9d4SSatish Balay aj++; 3091985db425SBarry Smith } 3092985db425SBarry Smith } 30939566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 30949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3095985db425SBarry Smith PetscFunctionReturn(0); 3096985db425SBarry Smith } 3097985db425SBarry Smith 3098d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3099d71ae5a4SJacob Faibussowitsch { 3100985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3101d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3102985db425SBarry Smith PetscScalar *x; 3103ce496241SStefano Zampini const MatScalar *aa, *av; 3104985db425SBarry Smith 3105985db425SBarry Smith PetscFunctionBegin; 310628b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3108ce496241SStefano Zampini aa = av; 3109985db425SBarry Smith ai = a->i; 3110985db425SBarry Smith aj = a->j; 3111985db425SBarry Smith 31129566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31139566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31149566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 311508401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3116985db425SBarry Smith for (i = 0; i < m; i++) { 31179371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31189371c9d4SSatish Balay ai++; 3119d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31209371c9d4SSatish Balay x[i] = *aa; 31219371c9d4SSatish Balay if (idx) idx[i] = 0; 3122985db425SBarry Smith } else { /* row is 
sparse so already KNOW maximum is 0.0 or higher */ 3123985db425SBarry Smith x[i] = 0.0; 3124985db425SBarry Smith if (idx) { 3125985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3126985db425SBarry Smith if (aj[j] > j) { 3127985db425SBarry Smith idx[i] = j; 3128985db425SBarry Smith break; 3129985db425SBarry Smith } 3130985db425SBarry Smith } 31311a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31321a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3133985db425SBarry Smith } 3134985db425SBarry Smith } 3135985db425SBarry Smith for (j = 0; j < ncols; j++) { 31369371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31379371c9d4SSatish Balay x[i] = *aa; 31389371c9d4SSatish Balay if (idx) idx[i] = *aj; 31399371c9d4SSatish Balay } 31409371c9d4SSatish Balay aa++; 31419371c9d4SSatish Balay aj++; 3142985db425SBarry Smith } 3143985db425SBarry Smith } 31449566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3146985db425SBarry Smith PetscFunctionReturn(0); 3147985db425SBarry Smith } 3148985db425SBarry Smith 3149d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3150d71ae5a4SJacob Faibussowitsch { 3151c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3152c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3153ce496241SStefano Zampini PetscScalar *x; 3154ce496241SStefano Zampini const MatScalar *aa, *av; 3155c87e5d42SMatthew Knepley 3156c87e5d42SMatthew Knepley PetscFunctionBegin; 31579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3158ce496241SStefano Zampini aa = av; 3159c87e5d42SMatthew Knepley ai = a->i; 3160c87e5d42SMatthew Knepley aj = a->j; 3161c87e5d42SMatthew Knepley 31629566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31639566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31649566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 316508401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3166c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 31679371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31689371c9d4SSatish Balay ai++; 3169f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 31709371c9d4SSatish Balay x[i] = *aa; 31719371c9d4SSatish Balay if (idx) idx[i] = 0; 3172f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3173f07e67edSHong Zhang x[i] = 0.0; 3174f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3175289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3176f07e67edSHong Zhang if (aj[j] > j) { 3177f07e67edSHong Zhang idx[i] = j; 31782205254eSKarl Rupp break; 31792205254eSKarl Rupp } 3180289a08f5SMatthew Knepley } 3181f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3182f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3183f07e67edSHong Zhang } 3184289a08f5SMatthew Knepley } 3185c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 31869371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 31879371c9d4SSatish Balay x[i] = *aa; 31889371c9d4SSatish Balay if (idx) idx[i] = *aj; 31899371c9d4SSatish Balay } 31909371c9d4SSatish Balay aa++; 31919371c9d4SSatish Balay aj++; 3192c87e5d42SMatthew Knepley } 3193c87e5d42SMatthew Knepley } 31949566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3196c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3197c87e5d42SMatthew Knepley } 3198c87e5d42SMatthew Knepley 3199d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3200d71ae5a4SJacob 
Faibussowitsch { 3201985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3202d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3203d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3204985db425SBarry Smith PetscScalar *x; 3205ce496241SStefano Zampini const MatScalar *aa, *av; 3206985db425SBarry Smith 3207985db425SBarry Smith PetscFunctionBegin; 320828b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3210ce496241SStefano Zampini aa = av; 3211985db425SBarry Smith ai = a->i; 3212985db425SBarry Smith aj = a->j; 3213985db425SBarry Smith 32149566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32159566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32169566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 321708401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3218985db425SBarry Smith for (i = 0; i < m; i++) { 32199371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32209371c9d4SSatish Balay ai++; 3221d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32229371c9d4SSatish Balay x[i] = *aa; 32239371c9d4SSatish Balay if (idx) idx[i] = 0; 3224985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3225985db425SBarry Smith x[i] = 0.0; 3226985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3227985db425SBarry Smith for (j = 0; j < ncols; j++) { 3228985db425SBarry Smith if (aj[j] > j) { 3229985db425SBarry Smith idx[i] = j; 3230985db425SBarry Smith break; 3231985db425SBarry Smith } 3232985db425SBarry Smith } 3233fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3234fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3235985db425SBarry Smith } 3236985db425SBarry Smith } 3237985db425SBarry Smith for (j = 0; j < 
ncols; j++) { 32389371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32399371c9d4SSatish Balay x[i] = *aa; 32409371c9d4SSatish Balay if (idx) idx[i] = *aj; 32419371c9d4SSatish Balay } 32429371c9d4SSatish Balay aa++; 32439371c9d4SSatish Balay aj++; 3244e34fafa9SBarry Smith } 3245e34fafa9SBarry Smith } 32469566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3248e34fafa9SBarry Smith PetscFunctionReturn(0); 3249e34fafa9SBarry Smith } 3250bbead8a2SBarry Smith 3251d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3252d71ae5a4SJacob Faibussowitsch { 3253bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 325433d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3255bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 32560da83c2eSBarry Smith const PetscReal shift = 0.0; 32571a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3258bbead8a2SBarry Smith 3259bbead8a2SBarry Smith PetscFunctionBegin; 3260a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 32614a0d0026SBarry Smith if (a->ibdiagvalid) { 32624a0d0026SBarry Smith if (values) *values = a->ibdiag; 32634a0d0026SBarry Smith PetscFunctionReturn(0); 32644a0d0026SBarry Smith } 32659566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 32664dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3267bbead8a2SBarry Smith diag = a->ibdiag; 3268bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3269bbead8a2SBarry Smith /* factor and invert each block */ 3270bbead8a2SBarry Smith switch (bs) { 3271bbead8a2SBarry Smith case 1: 3272bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32739566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 
3274ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3275ec1892c8SHong Zhang if (allowzeropivot) { 32767b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32777b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 32787b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 32799566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 328098921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3281ec1892c8SHong Zhang } 3282bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3283bbead8a2SBarry Smith } 3284bbead8a2SBarry Smith break; 3285bbead8a2SBarry Smith case 2: 3286bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32879371c9d4SSatish Balay ij[0] = 2 * i; 32889371c9d4SSatish Balay ij[1] = 2 * i + 1; 32899566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 32909566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 32917b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32929566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3293bbead8a2SBarry Smith diag += 4; 3294bbead8a2SBarry Smith } 3295bbead8a2SBarry Smith break; 3296bbead8a2SBarry Smith case 3: 3297bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 32989371c9d4SSatish Balay ij[0] = 3 * i; 32999371c9d4SSatish Balay ij[1] = 3 * i + 1; 33009371c9d4SSatish Balay ij[2] = 3 * i + 2; 33019566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33029566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 
33037b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33049566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3305bbead8a2SBarry Smith diag += 9; 3306bbead8a2SBarry Smith } 3307bbead8a2SBarry Smith break; 3308bbead8a2SBarry Smith case 4: 3309bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33109371c9d4SSatish Balay ij[0] = 4 * i; 33119371c9d4SSatish Balay ij[1] = 4 * i + 1; 33129371c9d4SSatish Balay ij[2] = 4 * i + 2; 33139371c9d4SSatish Balay ij[3] = 4 * i + 3; 33149566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33159566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33167b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33179566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3318bbead8a2SBarry Smith diag += 16; 3319bbead8a2SBarry Smith } 3320bbead8a2SBarry Smith break; 3321bbead8a2SBarry Smith case 5: 3322bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33239371c9d4SSatish Balay ij[0] = 5 * i; 33249371c9d4SSatish Balay ij[1] = 5 * i + 1; 33259371c9d4SSatish Balay ij[2] = 5 * i + 2; 33269371c9d4SSatish Balay ij[3] = 5 * i + 3; 33279371c9d4SSatish Balay ij[4] = 5 * i + 4; 33289566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33299566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33307b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33319566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3332bbead8a2SBarry Smith diag += 25; 3333bbead8a2SBarry Smith } 3334bbead8a2SBarry Smith break; 3335bbead8a2SBarry Smith case 6: 3336bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33379371c9d4SSatish Balay ij[0] = 6 * i; 33389371c9d4SSatish Balay ij[1] = 6 
* i + 1; 33399371c9d4SSatish Balay ij[2] = 6 * i + 2; 33409371c9d4SSatish Balay ij[3] = 6 * i + 3; 33419371c9d4SSatish Balay ij[4] = 6 * i + 4; 33429371c9d4SSatish Balay ij[5] = 6 * i + 5; 33439566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33449566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33457b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3347bbead8a2SBarry Smith diag += 36; 3348bbead8a2SBarry Smith } 3349bbead8a2SBarry Smith break; 3350bbead8a2SBarry Smith case 7: 3351bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33529371c9d4SSatish Balay ij[0] = 7 * i; 33539371c9d4SSatish Balay ij[1] = 7 * i + 1; 33549371c9d4SSatish Balay ij[2] = 7 * i + 2; 33559371c9d4SSatish Balay ij[3] = 7 * i + 3; 33569371c9d4SSatish Balay ij[4] = 7 * i + 4; 33579371c9d4SSatish Balay ij[5] = 7 * i + 5; 33589371c9d4SSatish Balay ij[6] = 7 * i + 6; /* seventh index of the 7x7 block: MatGetValues below reads ij[0..6], so slot 6 must be filled and slot 5 must keep 7*i+5 */ 33599566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 33609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 33617b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3363bbead8a2SBarry Smith diag += 49; 3364bbead8a2SBarry Smith } 3365bbead8a2SBarry Smith break; 3366bbead8a2SBarry Smith default: 33679566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3368bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3369ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 33709566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 33719566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, 
v_work, allowzeropivot, &zeropivotdetected)); 33727b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33739566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3374bbead8a2SBarry Smith diag += bs2; 3375bbead8a2SBarry Smith } 33769566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3377bbead8a2SBarry Smith } 3378bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3379bbead8a2SBarry Smith PetscFunctionReturn(0); 3380bbead8a2SBarry Smith } 3381bbead8a2SBarry Smith 3382d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3383d71ae5a4SJacob Faibussowitsch { 338473a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3385fff043a9SJunchao Zhang PetscScalar a, *aa; 338673a71a0fSBarry Smith PetscInt m, n, i, j, col; 338773a71a0fSBarry Smith 338873a71a0fSBarry Smith PetscFunctionBegin; 338973a71a0fSBarry Smith if (!x->assembled) { 33909566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 339173a71a0fSBarry Smith for (i = 0; i < m; i++) { 339273a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 33939566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 339473a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 33959566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 339673a71a0fSBarry Smith } 339773a71a0fSBarry Smith } 3398e2ce353bSJunchao Zhang } else { 33999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34009566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3402e2ce353bSJunchao Zhang } 34039566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34049566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 340573a71a0fSBarry Smith PetscFunctionReturn(0); 
340673a71a0fSBarry Smith } 340773a71a0fSBarry Smith 3408679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3409d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3410d71ae5a4SJacob Faibussowitsch { 3411679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3412679944adSJunchao Zhang PetscScalar a; 3413679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3414679944adSJunchao Zhang 3415679944adSJunchao Zhang PetscFunctionBegin; 3416679944adSJunchao Zhang nskip = high - low; 34179566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3418679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3419679944adSJunchao Zhang for (i = 0; i < m; i++) { 3420679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34219566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3422679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3423679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34249566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3425679944adSJunchao Zhang } 3426e2ce353bSJunchao Zhang } 34279566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34289566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 3429679944adSJunchao Zhang PetscFunctionReturn(0); 3430679944adSJunchao Zhang } 3431679944adSJunchao Zhang 3432682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 34330a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3434cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3435cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3436cb5b572fSBarry Smith MatMult_SeqAIJ, 343797304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34387c922b88SBarry Smith 
MatMultTranspose_SeqAIJ, 34397c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3440f4259b30SLisandro Dalcin NULL, 3441f4259b30SLisandro Dalcin NULL, 3442f4259b30SLisandro Dalcin NULL, 3443f4259b30SLisandro Dalcin /* 10*/ NULL, 3444cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3445f4259b30SLisandro Dalcin NULL, 344641f059aeSBarry Smith MatSOR_SeqAIJ, 344791e9d3e2SHong Zhang MatTranspose_SeqAIJ, 344897304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3449cb5b572fSBarry Smith MatEqual_SeqAIJ, 3450cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3451cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3452cb5b572fSBarry Smith MatNorm_SeqAIJ, 3453f4259b30SLisandro Dalcin /* 20*/ NULL, 3454cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3455cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3456cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3457d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3458f4259b30SLisandro Dalcin NULL, 3459f4259b30SLisandro Dalcin NULL, 3460f4259b30SLisandro Dalcin NULL, 3461f4259b30SLisandro Dalcin NULL, 34624994cf47SJed Brown /* 29*/ MatSetUp_SeqAIJ, 3463f4259b30SLisandro Dalcin NULL, 3464f4259b30SLisandro Dalcin NULL, 3465f4259b30SLisandro Dalcin NULL, 3466f4259b30SLisandro Dalcin NULL, 3467d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3468f4259b30SLisandro Dalcin NULL, 3469f4259b30SLisandro Dalcin NULL, 3470cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3471f4259b30SLisandro Dalcin NULL, 3472d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 34737dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3474cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3475cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3476cb5b572fSBarry Smith MatCopy_SeqAIJ, 3477d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3478cb5b572fSBarry Smith MatScale_SeqAIJ, 34797d68702bSBarry Smith MatShift_SeqAIJ, 348079299369SBarry Smith MatDiagonalSet_SeqAIJ, 34816e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 348273a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 34833b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 
34843b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 34853b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3486a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 348793dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3488f4259b30SLisandro Dalcin NULL, 3489f4259b30SLisandro Dalcin NULL, 3490cda55fadSBarry Smith MatPermute_SeqAIJ, 3491f4259b30SLisandro Dalcin NULL, 3492f4259b30SLisandro Dalcin /* 59*/ NULL, 3493b9b97703SBarry Smith MatDestroy_SeqAIJ, 3494b9b97703SBarry Smith MatView_SeqAIJ, 3495f4259b30SLisandro Dalcin NULL, 3496f4259b30SLisandro Dalcin NULL, 3497f4259b30SLisandro Dalcin /* 64*/ NULL, 3498321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3499f4259b30SLisandro Dalcin NULL, 3500f4259b30SLisandro Dalcin NULL, 3501f4259b30SLisandro Dalcin NULL, 3502d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3503c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3504f4259b30SLisandro Dalcin NULL, 3505f4259b30SLisandro Dalcin NULL, 3506f4259b30SLisandro Dalcin NULL, 3507f4259b30SLisandro Dalcin /* 74*/ NULL, 35083acb8795SBarry Smith MatFDColoringApply_AIJ, 3509f4259b30SLisandro Dalcin NULL, 3510f4259b30SLisandro Dalcin NULL, 3511f4259b30SLisandro Dalcin NULL, 35126ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3513f4259b30SLisandro Dalcin NULL, 3514f4259b30SLisandro Dalcin NULL, 3515f4259b30SLisandro Dalcin NULL, 3516bc011b1eSHong Zhang MatLoad_SeqAIJ, 3517d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35181cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3519f4259b30SLisandro Dalcin NULL, 3520f4259b30SLisandro Dalcin NULL, 3521f4259b30SLisandro Dalcin NULL, 3522f4259b30SLisandro Dalcin /* 89*/ NULL, 3523f4259b30SLisandro Dalcin NULL, 352426be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3525f4259b30SLisandro Dalcin NULL, 3526f4259b30SLisandro Dalcin NULL, 35278fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3528f4259b30SLisandro Dalcin NULL, 3529f4259b30SLisandro Dalcin NULL, 35306fc122caSHong Zhang 
MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3531f4259b30SLisandro Dalcin NULL, 35324222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3533f4259b30SLisandro Dalcin NULL, 3534f4259b30SLisandro Dalcin NULL, 353587d4246cSBarry Smith MatConjugate_SeqAIJ, 3536f4259b30SLisandro Dalcin NULL, 3537d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 353899cafbc1SBarry Smith MatRealPart_SeqAIJ, 3539f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3540f4259b30SLisandro Dalcin NULL, 3541f4259b30SLisandro Dalcin NULL, 3542cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3543f4259b30SLisandro Dalcin NULL, 35442af78befSBarry Smith MatGetRowMin_SeqAIJ, 3545f4259b30SLisandro Dalcin NULL, 3546599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3547f4259b30SLisandro Dalcin /*114*/ NULL, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin NULL, 3550f4259b30SLisandro Dalcin NULL, 3551f4259b30SLisandro Dalcin NULL, 3552f4259b30SLisandro Dalcin /*119*/ NULL, 3553f4259b30SLisandro Dalcin NULL, 3554f4259b30SLisandro Dalcin NULL, 3555f4259b30SLisandro Dalcin NULL, 3556b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 35570716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3558a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 355937868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 35600da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3561f4259b30SLisandro Dalcin NULL, 3562f4259b30SLisandro Dalcin /*129*/ NULL, 3563f4259b30SLisandro Dalcin NULL, 3564f4259b30SLisandro Dalcin NULL, 356575648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3566b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3567b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 35682b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3569f4259b30SLisandro Dalcin NULL, 3570f4259b30SLisandro Dalcin NULL, 35713964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3572f4259b30SLisandro Dalcin /*139*/ NULL, 3573f4259b30SLisandro Dalcin NULL, 3574f4259b30SLisandro Dalcin 
NULL, 35753a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 35769c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 35774222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 35784222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3579f4259b30SLisandro Dalcin NULL, 358072833a62Smarkadams4 NULL, 358172833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 35822d776b49SBarry Smith NULL, 3583*dec0b466SHong Zhang /*150*/ MatTransposeSymbolic_SeqAIJ, 3584*dec0b466SHong Zhang MatEliminateZeros_SeqAIJ}; 358517ab2063SBarry Smith 3586d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3587d71ae5a4SJacob Faibussowitsch { 3588bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 358997f1f81fSBarry Smith PetscInt i, nz, n; 3590bef8e0ddSBarry Smith 3591bef8e0ddSBarry Smith PetscFunctionBegin; 3592bef8e0ddSBarry Smith nz = aij->maxnz; 3593d0f46423SBarry Smith n = mat->rmap->n; 3594ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3595bef8e0ddSBarry Smith aij->nz = nz; 3596ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 3597bef8e0ddSBarry Smith PetscFunctionReturn(0); 3598bef8e0ddSBarry Smith } 3599bef8e0ddSBarry Smith 3600a3bb6f32SFande Kong /* 3601ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3602ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3603ddea5d60SJunchao Zhang */ 3604d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3605d71ae5a4SJacob Faibussowitsch { 3606a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3607a3bb6f32SFande Kong PetscTable gid1_lid1; 3608a3bb6f32SFande Kong PetscTablePosition tpos; 360925b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 361025b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3611a3bb6f32SFande Kong 3612a3bb6f32SFande Kong PetscFunctionBegin; 3613a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3614a3bb6f32SFande Kong PetscValidPointer(mapping, 2); 3615a3bb6f32SFande Kong /* use a table */ 36169566063dSJacob Faibussowitsch PetscCall(PetscTableCreate(mat->rmap->n, mat->cmap->N + 1, &gid1_lid1)); 3617a3bb6f32SFande Kong ec = 0; 361825b670f0SStefano Zampini for (i = 0; i < nz; i++) { 361925b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 36209566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1, gid1, &data)); 3621a3bb6f32SFande Kong if (!data) { 3622a3bb6f32SFande Kong /* one based table */ 36239566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1, gid1, ++ec, INSERT_VALUES)); 3624a3bb6f32SFande Kong } 3625a3bb6f32SFande Kong } 3626a3bb6f32SFande Kong /* form array of columns we need */ 36279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 36289566063dSJacob Faibussowitsch PetscCall(PetscTableGetHeadPosition(gid1_lid1, &tpos)); 3629a3bb6f32SFande Kong while (tpos) { 36309566063dSJacob Faibussowitsch PetscCall(PetscTableGetNext(gid1_lid1, &tpos, &gid, &lid)); 3631a3bb6f32SFande Kong gid--; 3632a3bb6f32SFande Kong lid--; 3633a3bb6f32SFande Kong garray[lid] = gid; 3634a3bb6f32SFande Kong } 36359566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* 
sort, and rebuild */ 36369566063dSJacob Faibussowitsch PetscCall(PetscTableRemoveAll(gid1_lid1)); 363748a46eb9SPierre Jolivet for (i = 0; i < ec; i++) PetscCall(PetscTableAdd(gid1_lid1, garray[i] + 1, i + 1, INSERT_VALUES)); 3638a3bb6f32SFande Kong /* compact out the extra columns in B */ 363925b670f0SStefano Zampini for (i = 0; i < nz; i++) { 364025b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 36419566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1, gid1, &lid)); 3642a3bb6f32SFande Kong lid--; 364325b670f0SStefano Zampini jj[i] = lid; 3644a3bb6f32SFande Kong } 36459566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 36469566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy(&gid1_lid1)); 36479566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36489566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36499566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 3650a3bb6f32SFande Kong PetscFunctionReturn(0); 3651a3bb6f32SFande Kong } 3652a3bb6f32SFande Kong 3653bef8e0ddSBarry Smith /*@ 3654bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3655bef8e0ddSBarry Smith in the matrix. 3656bef8e0ddSBarry Smith 3657bef8e0ddSBarry Smith Input Parameters: 365811a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3659bef8e0ddSBarry Smith - indices - the column indices 3660bef8e0ddSBarry Smith 366115091d37SBarry Smith Level: advanced 366215091d37SBarry Smith 3663bef8e0ddSBarry Smith Notes: 3664bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3665bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 366611a5261eSBarry Smith of the `MatSetValues()` operation. 
3667bef8e0ddSBarry Smith 3668bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 366911a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3670bef8e0ddSBarry Smith 367111a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3672bef8e0ddSBarry Smith 3673b9617806SBarry Smith The indices should start with zero, not one. 3674b9617806SBarry Smith 3675bef8e0ddSBarry Smith @*/ 3676d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3677d71ae5a4SJacob Faibussowitsch { 3678bef8e0ddSBarry Smith PetscFunctionBegin; 36790700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3680dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 3681cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 3682bef8e0ddSBarry Smith PetscFunctionReturn(0); 3683bef8e0ddSBarry Smith } 3684bef8e0ddSBarry Smith 3685be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3686be6bf707SBarry Smith 3687d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3688d71ae5a4SJacob Faibussowitsch { 3689be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3690d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3691be6bf707SBarry Smith 3692be6bf707SBarry Smith PetscFunctionBegin; 369328b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3694be6bf707SBarry Smith 3695be6bf707SBarry Smith /* allocate space for values if not already there */ 36964dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3697be6bf707SBarry Smith 3698be6bf707SBarry Smith /* copy values over */ 36999566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, 
nz)); 3700be6bf707SBarry Smith PetscFunctionReturn(0); 3701be6bf707SBarry Smith } 3702be6bf707SBarry Smith 3703be6bf707SBarry Smith /*@ 3704be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3705be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3706be6bf707SBarry Smith nonlinear portion. 3707be6bf707SBarry Smith 370811a5261eSBarry Smith Collect on mat 3709be6bf707SBarry Smith 3710be6bf707SBarry Smith Input Parameters: 371111a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3712be6bf707SBarry Smith 371315091d37SBarry Smith Level: advanced 371415091d37SBarry Smith 371511a5261eSBarry Smith Common Usage, with `SNESSolve()`: 3716be6bf707SBarry Smith $ Create Jacobian matrix 3717be6bf707SBarry Smith $ Set linear terms into matrix 3718be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3719be6bf707SBarry Smith $ final nonzero structure (i.e. setting the nonlinear terms and applying 3720be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure 3721512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3722be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3723be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3724be6bf707SBarry Smith $ In your Jacobian routine 3725be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3726be6bf707SBarry Smith $ Set nonlinear terms in matrix 3727be6bf707SBarry Smith 3728be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. 
when you handle nonlinear solve yourself: 3729be6bf707SBarry Smith $ // build linear portion of Jacobian 3730512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3731be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3732be6bf707SBarry Smith $ loop over nonlinear iterations 3733be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3734be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonlinear portion of Jacobian 3735be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3736be6bf707SBarry Smith $ Solve linear system with Jacobian 3737be6bf707SBarry Smith $ endloop 3738be6bf707SBarry Smith 3739be6bf707SBarry Smith Notes: 3740be6bf707SBarry Smith Matrix must already be assembled before calling this routine 374111a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3742be6bf707SBarry Smith calling this routine. 3743be6bf707SBarry Smith 37440c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37450c468ba9SBarry Smith and does not allocate additional space.
37460c468ba9SBarry Smith 3747db781477SPatrick Sanan .seealso: `MatRetrieveValues()` 3748be6bf707SBarry Smith @*/ 3749d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3750d71ae5a4SJacob Faibussowitsch { 3751be6bf707SBarry Smith PetscFunctionBegin; 37520700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 375328b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 375428b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3755cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 3756be6bf707SBarry Smith PetscFunctionReturn(0); 3757be6bf707SBarry Smith } 3758be6bf707SBarry Smith 3759d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3760d71ae5a4SJacob Faibussowitsch { 3761be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3762d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3763be6bf707SBarry Smith 3764be6bf707SBarry Smith PetscFunctionBegin; 376528b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 376628b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3767be6bf707SBarry Smith /* copy values over */ 37689566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 3769be6bf707SBarry Smith PetscFunctionReturn(0); 3770be6bf707SBarry Smith } 3771be6bf707SBarry Smith 3772be6bf707SBarry Smith /*@ 3773be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3774be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3775be6bf707SBarry Smith nonlinear portion. 
3776be6bf707SBarry Smith 377711a5261eSBarry Smith Collect on mat 3778be6bf707SBarry Smith 3779be6bf707SBarry Smith Input Parameters: 378011a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3781be6bf707SBarry Smith 378215091d37SBarry Smith Level: advanced 378315091d37SBarry Smith 3784db781477SPatrick Sanan .seealso: `MatStoreValues()` 3785be6bf707SBarry Smith @*/ 3786d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3787d71ae5a4SJacob Faibussowitsch { 3788be6bf707SBarry Smith PetscFunctionBegin; 37890700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 379028b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 379128b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3792cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 3793be6bf707SBarry Smith PetscFunctionReturn(0); 3794be6bf707SBarry Smith } 3795be6bf707SBarry Smith 3796be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 379717ab2063SBarry Smith /*@C 379811a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 37990d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 38006e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 380151c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 38022bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 380317ab2063SBarry Smith 3804d083f849SBarry Smith Collective 3805db81eaa0SLois Curfman McInnes 380617ab2063SBarry Smith Input Parameters: 380711a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 380817ab2063SBarry Smith . 
m - number of rows 380917ab2063SBarry Smith . n - number of columns 381017ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 381151c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38120298fd71SBarry Smith (possibly different for each row) or NULL 381317ab2063SBarry Smith 381417ab2063SBarry Smith Output Parameter: 3815416022c9SBarry Smith . A - the matrix 381617ab2063SBarry Smith 381711a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 3818f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 381911a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 3820175b88e8SBarry Smith 3821b259b22eSLois Curfman McInnes Notes: 382249a6f317SBarry Smith If nnz is given then nz is ignored 382349a6f317SBarry Smith 382411a5261eSBarry Smith The AIJ format, also called 382511a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 38260002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 382744cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 382817ab2063SBarry Smith 382917ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 383011a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 38313d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 38326da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 383317ab2063SBarry Smith 3834682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38354fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. 
We 3836682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38376c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 38386c7ebb05SLois Curfman McInnes 38396c7ebb05SLois Curfman McInnes Options Database Keys: 3840698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 38419db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 384217ab2063SBarry Smith 3843027ccd11SLois Curfman McInnes Level: intermediate 3844027ccd11SLois Curfman McInnes 384560161072SBarry Smith .seealso: [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 384617ab2063SBarry Smith @*/ 3847d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3848d71ae5a4SJacob Faibussowitsch { 38493a40ed3dSBarry Smith PetscFunctionBegin; 38509566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 38519566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 38529566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 38539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 3854273d9f13SBarry Smith PetscFunctionReturn(0); 3855273d9f13SBarry Smith } 3856273d9f13SBarry Smith 3857273d9f13SBarry Smith /*@C 3858273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3859273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3860273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3861273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 
3862273d9f13SBarry Smith 3863d083f849SBarry Smith Collective 3864273d9f13SBarry Smith 3865273d9f13SBarry Smith Input Parameters: 38661c4f3114SJed Brown + B - The matrix 3867273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3868273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38690298fd71SBarry Smith (possibly different for each row) or NULL 3870273d9f13SBarry Smith 3871273d9f13SBarry Smith Notes: 387249a6f317SBarry Smith If nnz is given then nz is ignored 387349a6f317SBarry Smith 387411a5261eSBarry Smith The `MATSEQAIJ` format also called 387511a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 3876273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3877273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3878273d9f13SBarry Smith 3879273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 388011a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 3881273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3882273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3883273d9f13SBarry Smith 388411a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3885aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3886aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3887aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3888aa95bbe8SBarry Smith 388911a5261eSBarry Smith Developer Notes: 389011a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3891a96a251dSBarry Smith entries or columns indices 3892a96a251dSBarry Smith 3893273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3894273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3895273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3896273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3897273d9f13SBarry Smith 3898273d9f13SBarry Smith Options Database Keys: 3899698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 390047b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3901273d9f13SBarry Smith 3902273d9f13SBarry Smith Level: intermediate 3903273d9f13SBarry Smith 3904db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3905db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3906273d9f13SBarry Smith @*/ 3907d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3908d71ae5a4SJacob Faibussowitsch { 3909a23d5eceSKris Buschelman PetscFunctionBegin; 39106ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39116ba663aaSJed Brown PetscValidType(B, 1); 3912cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 3913a23d5eceSKris Buschelman PetscFunctionReturn(0); 3914a23d5eceSKris Buschelman } 3915a23d5eceSKris Buschelman 3916d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3917d71ae5a4SJacob Faibussowitsch { 3918273d9f13SBarry Smith Mat_SeqAIJ *b; 39192576faa2SJed Brown PetscBool skipallocation = 
PETSC_FALSE, realalloc = PETSC_FALSE; 392097f1f81fSBarry Smith PetscInt i; 3921273d9f13SBarry Smith 3922273d9f13SBarry Smith PetscFunctionBegin; 39232576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3924a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3925c461c341SBarry Smith skipallocation = PETSC_TRUE; 3926c461c341SBarry Smith nz = 0; 3927c461c341SBarry Smith } 39289566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39299566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3930899cda47SBarry Smith 3931435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 393208401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3933cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3934d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 393508401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 393608401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3937b73539f3SBarry Smith } 3938b73539f3SBarry Smith } 3939b73539f3SBarry Smith 3940273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 39412205254eSKarl Rupp 3942273d9f13SBarry Smith b = (Mat_SeqAIJ *)B->data; 3943273d9f13SBarry Smith 3944ab93d7beSBarry Smith if (!skipallocation) { 39454dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3946071fcb05SBarry Smith if (!b->ilen) { 3947071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39489566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3949071fcb05SBarry Smith } else { 39509566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39512ee49352SLisandro Dalcin } 39524dfa11a4SJacob Faibussowitsch if (!b->ipre) { PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); } 3953273d9f13SBarry Smith if (!nnz) { 3954435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3955c62bd62aSJed Brown else if (nz < 0) nz = 1; 39565d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3957d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 3958d0f46423SBarry Smith nz = nz * B->rmap->n; 3959273d9f13SBarry Smith } else { 3960c73702f5SBarry Smith PetscInt64 nz64 = 0; 39619371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 39629371c9d4SSatish Balay b->imax[i] = nnz[i]; 39639371c9d4SSatish Balay nz64 += nnz[i]; 39649371c9d4SSatish Balay } 39659566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 3966273d9f13SBarry Smith } 3967ab93d7beSBarry Smith 3968273d9f13SBarry Smith /* allocate the matrix space */ 396953dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 39709566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 3971396832f4SHong Zhang if (B->structure_only) { 39729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 39739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 3974396832f4SHong Zhang } else { 39759566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 3976396832f4SHong Zhang } 3977bfeeae90SHong Zhang b->i[0] = 0; 3978ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 3979396832f4SHong Zhang if (B->structure_only) { 3980396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 3981396832f4SHong Zhang b->free_a = PETSC_FALSE; 3982396832f4SHong Zhang } else { 3983273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 3984e6b907acSBarry Smith b->free_a = PETSC_TRUE; 3985396832f4SHong Zhang } 3986e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 3987c461c341SBarry Smith } else { 3988e6b907acSBarry Smith b->free_a = PETSC_FALSE; 3989e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 3990c461c341SBarry Smith } 3991273d9f13SBarry Smith 3992846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 3993846b4da1SFande Kong /* reserve user-requested sparsity */ 39949566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 3995846b4da1SFande Kong } 3996846b4da1SFande Kong 3997273d9f13SBarry Smith b->nz = 0; 3998273d9f13SBarry Smith b->maxnz = nz; 3999273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40001baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4001cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4002cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40035519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40045519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40055519a089SJose E. Roman */ 40065519a089SJose E. Roman B->nonzerostate++; 4007273d9f13SBarry Smith PetscFunctionReturn(0); 4008273d9f13SBarry Smith } 4009273d9f13SBarry Smith 4010d71ae5a4SJacob Faibussowitsch PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4011d71ae5a4SJacob Faibussowitsch { 4012846b4da1SFande Kong Mat_SeqAIJ *a; 4013a5bbaf83SFande Kong PetscInt i; 4014846b4da1SFande Kong 4015846b4da1SFande Kong PetscFunctionBegin; 4016846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 401714d0e64fSAlex Lindsay 401814d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 401914d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 402014d0e64fSAlex Lindsay 4021846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40222c814fdeSFande Kong /* if no saved info, we error out */ 402328b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40242c814fdeSFande Kong 4025aed4548fSBarry Smith PetscCheck(a->i && a->j && a->a && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40262c814fdeSFande Kong 40279566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40289566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4029846b4da1SFande Kong a->i[0] = 0; 4030ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4031846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4032846b4da1SFande Kong a->nz = 0; 4033846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4034846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4035846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4036846b4da1SFande Kong A->assembled = PETSC_FALSE; 4037846b4da1SFande Kong PetscFunctionReturn(0); 4038846b4da1SFande Kong } 4039846b4da1SFande Kong 404058d36128SBarry Smith /*@ 404111a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a 
sparse sequential matrix in `MATSEQAIJ` format.

   Input Parameters:
+  B - the matrix
.  i - the indices into j for the start of each row (starts with zero)
.  j - the column indices for each row (starts with zero); these must be sorted for each row
-  v - optional values in the matrix

   Level: developer

   Notes:
   The i, j, and v values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`

   This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
   structure will be the union of all the previous nonzero structures.

   Developer Notes:
   An optimization could be added to the implementation where it checks if i and j are identical to the current i and j and
   then just copies the v values directly with `PetscMemcpy()`.

   This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
40626a9b8d82SBarry Smith 4063db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()` 4064a1661176SMatthew Knepley @*/ 4065d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4066d71ae5a4SJacob Faibussowitsch { 4067a1661176SMatthew Knepley PetscFunctionBegin; 40680700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 40696ba663aaSJed Brown PetscValidType(B, 1); 4070cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 4071a1661176SMatthew Knepley PetscFunctionReturn(0); 4072a1661176SMatthew Knepley } 4073a1661176SMatthew Knepley 4074d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4075d71ae5a4SJacob Faibussowitsch { 4076a1661176SMatthew Knepley PetscInt i; 4077a1661176SMatthew Knepley PetscInt m, n; 4078a1661176SMatthew Knepley PetscInt nz; 40796a9b8d82SBarry Smith PetscInt *nnz; 4080a1661176SMatthew Knepley 4081a1661176SMatthew Knepley PetscFunctionBegin; 4082aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4083779a8d59SSatish Balay 40849566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 40859566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4086779a8d59SSatish Balay 40879566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 40889566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4089a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4090b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 409108401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a 
negative number of columns %" PetscInt_FMT, i, nz); 4092a1661176SMatthew Knepley nnz[i] = nz; 4093a1661176SMatthew Knepley } 40949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 40959566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4096a1661176SMatthew Knepley 409748a46eb9SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4098a1661176SMatthew Knepley 40999566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41009566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4101a1661176SMatthew Knepley 41029566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 4103a1661176SMatthew Knepley PetscFunctionReturn(0); 4104a1661176SMatthew Knepley } 4105a1661176SMatthew Knepley 4106ad7e164aSPierre Jolivet /*@ 4107ad7e164aSPierre Jolivet MatSeqAIJKron - Computes C, the Kronecker product of A and B. 4108ad7e164aSPierre Jolivet 4109ad7e164aSPierre Jolivet Input Parameters: 4110ad7e164aSPierre Jolivet + A - left-hand side matrix 4111ad7e164aSPierre Jolivet . B - right-hand side matrix 411211a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4113ad7e164aSPierre Jolivet 4114ad7e164aSPierre Jolivet Output Parameter: 4115ad7e164aSPierre Jolivet . C - Kronecker product of A and B 4116ad7e164aSPierre Jolivet 4117ad7e164aSPierre Jolivet Level: intermediate 4118ad7e164aSPierre Jolivet 411911a5261eSBarry Smith Note: 412011a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4121ad7e164aSPierre Jolivet 4122db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4123ad7e164aSPierre Jolivet @*/ 4124d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4125d71ae5a4SJacob Faibussowitsch { 4126ad7e164aSPierre Jolivet PetscFunctionBegin; 4127ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4128ad7e164aSPierre Jolivet PetscValidType(A, 1); 4129ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4130ad7e164aSPierre Jolivet PetscValidType(B, 2); 4131ad7e164aSPierre Jolivet PetscValidPointer(C, 4); 4132ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4133ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4134ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4135ad7e164aSPierre Jolivet } 4136cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 4137ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4138ad7e164aSPierre Jolivet } 4139ad7e164aSPierre Jolivet 4140d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4141d71ae5a4SJacob Faibussowitsch { 4142ad7e164aSPierre Jolivet Mat newmat; 4143ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4144ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4145ad7e164aSPierre Jolivet PetscScalar *v; 4146fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4147ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4148ad7e164aSPierre Jolivet PetscBool flg; 4149ad7e164aSPierre Jolivet 4150ad7e164aSPierre Jolivet PetscFunctionBegin; 415128b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 415228b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled 
matrix"); 415328b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 415428b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 41559566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 415628b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4157aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4158ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 41599566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 41609566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 41619566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 41629566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4163ad7e164aSPierre Jolivet i[0] = 0; 4164ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4165ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4166ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4167ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4168ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4169ad7e164aSPierre Jolivet } 4170ad7e164aSPierre Jolivet } 4171ad7e164aSPierre Jolivet } 41729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4173ad7e164aSPierre Jolivet *C = newmat; 41749566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4175ad7e164aSPierre Jolivet nnz = 0; 4176ad7e164aSPierre Jolivet } 41779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 41789566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 41799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4180ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4181ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4182ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4183ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4184ad7e164aSPierre Jolivet } 4185ad7e164aSPierre Jolivet } 4186ad7e164aSPierre Jolivet } 41879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 41889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 41899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 4190ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4191ad7e164aSPierre Jolivet } 4192ad7e164aSPierre Jolivet 4193c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4194af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4195170fe5c8SBarry Smith 4196170fe5c8SBarry Smith /* 4197170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4198170fe5c8SBarry Smith 4199170fe5c8SBarry Smith n p p 42002da392ccSBarry Smith [ ] [ ] [ ] 42012da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42022da392ccSBarry Smith [ ] [ ] [ ] 4203170fe5c8SBarry Smith 4204170fe5c8SBarry Smith */ 4205d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4206d71ae5a4SJacob Faibussowitsch { 4207170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4208170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4209170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 421086214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4211170fe5c8SBarry Smith const PetscInt *ii, *idx; 4212170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4213170fe5c8SBarry Smith PetscScalar *c, *c_q; 421486214ceeSStefano Zampini PetscInt clda = sub_c->lda; 421586214ceeSStefano Zampini PetscInt 
alda = sub_a->lda; 4216170fe5c8SBarry Smith 4217170fe5c8SBarry Smith PetscFunctionBegin; 4218d0f46423SBarry Smith m = A->rmap->n; 4219d0f46423SBarry Smith n = A->cmap->n; 4220d0f46423SBarry Smith p = B->cmap->n; 4221170fe5c8SBarry Smith a = sub_a->v; 4222170fe5c8SBarry Smith b = sub_b->a; 4223170fe5c8SBarry Smith c = sub_c->v; 422486214ceeSStefano Zampini if (clda == m) { 42259566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 422686214ceeSStefano Zampini } else { 422786214ceeSStefano Zampini for (j = 0; j < p; j++) 42289371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 422986214ceeSStefano Zampini } 4230170fe5c8SBarry Smith ii = sub_b->i; 4231170fe5c8SBarry Smith idx = sub_b->j; 4232170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4233170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4234170fe5c8SBarry Smith while (q-- > 0) { 423586214ceeSStefano Zampini c_q = c + clda * (*idx); 423686214ceeSStefano Zampini a_q = a + alda * i; 4237854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4238170fe5c8SBarry Smith idx++; 4239170fe5c8SBarry Smith b++; 4240170fe5c8SBarry Smith } 4241170fe5c8SBarry Smith } 4242170fe5c8SBarry Smith PetscFunctionReturn(0); 4243170fe5c8SBarry Smith } 4244170fe5c8SBarry Smith 4245d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4246d71ae5a4SJacob Faibussowitsch { 4247d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 424886214ceeSStefano Zampini PetscBool cisdense; 4249170fe5c8SBarry Smith 4250170fe5c8SBarry Smith PetscFunctionBegin; 425108401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42529566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 42539566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 42549566063dSJacob Faibussowitsch 
PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, "")); 425548a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 42569566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4257d73949e8SHong Zhang 42584222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4259170fe5c8SBarry Smith PetscFunctionReturn(0); 4260170fe5c8SBarry Smith } 4261170fe5c8SBarry Smith 4262170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 42630bad9183SKris Buschelman /*MC 4264fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 42650bad9183SKris Buschelman based on compressed sparse row format. 42660bad9183SKris Buschelman 42670bad9183SKris Buschelman Options Database Keys: 42680bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 42690bad9183SKris Buschelman 42700bad9183SKris Buschelman Level: beginner 42710bad9183SKris Buschelman 42720cd7f59aSBarry Smith Notes: 427311a5261eSBarry Smith `MatSetValues()` may be called for this matrix type with a NULL argument for the numerical values, 42740cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 42750cd7f59aSBarry Smith in the matrix 42760cd7f59aSBarry Smith 427711a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this case no space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored

   Developer Note:
    It would be nice if all matrix formats supported passing NULL in for the numerical values

.seealso: `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
   and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
   `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Keys:
. -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`

   Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`; this type also automatically switches over to use inodes when
4301ccd284c7SBarry Smith 4302ccd284c7SBarry Smith Level: beginner 4303ccd284c7SBarry Smith 4304db781477SPatrick Sanan .seealso: `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4305ccd284c7SBarry Smith M*/ 4306ccd284c7SBarry Smith 4307ccd284c7SBarry Smith /*MC 4308ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4309ccd284c7SBarry Smith 431011a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 431111a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 431211a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4313ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4314ccd284c7SBarry Smith the above preallocation routines for simplicity. 4315ccd284c7SBarry Smith 4316ccd284c7SBarry Smith Options Database Keys: 431711a5261eSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 4318ccd284c7SBarry Smith 4319ccd284c7SBarry Smith Level: beginner 4320ccd284c7SBarry Smith 4321c2e3fba1SPatrick Sanan .seealso: `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4322ccd284c7SBarry Smith M*/ 4323ccd284c7SBarry Smith 43247906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43257906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43267906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43277906f579SHong Zhang #endif 4328d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4329d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4330d24d4204SJose E. 
Roman #endif 43317906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43327906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43337906f579SHong Zhang #endif 43347906f579SHong Zhang 4335d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4336c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43374222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43387906f579SHong Zhang 43398c778c55SBarry Smith /*@C 434011a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43418c778c55SBarry Smith 43428c778c55SBarry Smith Not Collective 43438c778c55SBarry Smith 43448c778c55SBarry Smith Input Parameter: 434511a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 43468c778c55SBarry Smith 43478c778c55SBarry Smith Output Parameter: 43488c778c55SBarry Smith . 
array - pointer to the data 43498c778c55SBarry Smith 43508c778c55SBarry Smith Level: intermediate 43518c778c55SBarry Smith 4352db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 43538c778c55SBarry Smith @*/ 4354d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4355d71ae5a4SJacob Faibussowitsch { 4356d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 43578c778c55SBarry Smith 43588c778c55SBarry Smith PetscFunctionBegin; 4359d67d9f35SJunchao Zhang if (aij->ops->getarray) { 43609566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4361d67d9f35SJunchao Zhang } else { 4362d67d9f35SJunchao Zhang *array = aij->a; 4363d67d9f35SJunchao Zhang } 4364d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4365d67d9f35SJunchao Zhang } 4366d67d9f35SJunchao Zhang 4367d67d9f35SJunchao Zhang /*@C 436811a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4369d67d9f35SJunchao Zhang 4370d67d9f35SJunchao Zhang Not Collective 4371d67d9f35SJunchao Zhang 4372d67d9f35SJunchao Zhang Input Parameters: 437311a5261eSBarry Smith + mat - a `MATSEQAIJ` matrix 4374d67d9f35SJunchao Zhang - array - pointer to the data 4375d67d9f35SJunchao Zhang 4376d67d9f35SJunchao Zhang Level: intermediate 4377d67d9f35SJunchao Zhang 4378db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4379d67d9f35SJunchao Zhang @*/ 4380d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array) 4381d71ae5a4SJacob Faibussowitsch { 4382d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4383d67d9f35SJunchao Zhang 4384d67d9f35SJunchao Zhang PetscFunctionBegin; 4385d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 43869566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4387d67d9f35SJunchao Zhang } else { 4388d67d9f35SJunchao 
Zhang *array = NULL; 4389d67d9f35SJunchao Zhang } 43909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 43919566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 43928c778c55SBarry Smith PetscFunctionReturn(0); 43938c778c55SBarry Smith } 43948c778c55SBarry Smith 439521e72a00SBarry Smith /*@C 439611a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 43978f1ea47aSStefano Zampini 43988f1ea47aSStefano Zampini Not Collective 43998f1ea47aSStefano Zampini 44008f1ea47aSStefano Zampini Input Parameter: 440111a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44028f1ea47aSStefano Zampini 44038f1ea47aSStefano Zampini Output Parameter: 44048f1ea47aSStefano Zampini . array - pointer to the data 44058f1ea47aSStefano Zampini 44068f1ea47aSStefano Zampini Level: intermediate 44078f1ea47aSStefano Zampini 4408db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44098f1ea47aSStefano Zampini @*/ 4410d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4411d71ae5a4SJacob Faibussowitsch { 4412d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44138f1ea47aSStefano Zampini 44148f1ea47aSStefano Zampini PetscFunctionBegin; 4415d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44169566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4417d67d9f35SJunchao Zhang } else { 4418d67d9f35SJunchao Zhang *array = aij->a; 4419d67d9f35SJunchao Zhang } 44208f1ea47aSStefano Zampini PetscFunctionReturn(0); 44218f1ea47aSStefano Zampini } 44228f1ea47aSStefano Zampini 44238f1ea47aSStefano Zampini /*@C 442411a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44258f1ea47aSStefano Zampini 44268f1ea47aSStefano Zampini Not Collective 44278f1ea47aSStefano Zampini 44288f1ea47aSStefano Zampini Input 
Parameter: 442911a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44308f1ea47aSStefano Zampini 44318f1ea47aSStefano Zampini Output Parameter: 44328f1ea47aSStefano Zampini . array - pointer to the data 44338f1ea47aSStefano Zampini 44348f1ea47aSStefano Zampini Level: intermediate 44358f1ea47aSStefano Zampini 4436db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44378f1ea47aSStefano Zampini @*/ 4438d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4439d71ae5a4SJacob Faibussowitsch { 4440d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44418f1ea47aSStefano Zampini 44428f1ea47aSStefano Zampini PetscFunctionBegin; 4443d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44449566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4445d67d9f35SJunchao Zhang } else { 4446d67d9f35SJunchao Zhang *array = NULL; 4447d67d9f35SJunchao Zhang } 4448d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4449d67d9f35SJunchao Zhang } 4450d67d9f35SJunchao Zhang 4451d67d9f35SJunchao Zhang /*@C 445211a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4453d67d9f35SJunchao Zhang 4454d67d9f35SJunchao Zhang Not Collective 4455d67d9f35SJunchao Zhang 4456d67d9f35SJunchao Zhang Input Parameter: 445711a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 4458d67d9f35SJunchao Zhang 4459d67d9f35SJunchao Zhang Output Parameter: 4460d67d9f35SJunchao Zhang . 
array - pointer to the data 4461d67d9f35SJunchao Zhang 4462d67d9f35SJunchao Zhang Level: intermediate 4463d67d9f35SJunchao Zhang 4464db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4465d67d9f35SJunchao Zhang @*/ 4466d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4467d71ae5a4SJacob Faibussowitsch { 4468d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4469d67d9f35SJunchao Zhang 4470d67d9f35SJunchao Zhang PetscFunctionBegin; 4471d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 44729566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4473d67d9f35SJunchao Zhang } else { 4474d67d9f35SJunchao Zhang *array = aij->a; 4475d67d9f35SJunchao Zhang } 44769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44779566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 4478d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4479d67d9f35SJunchao Zhang } 4480d67d9f35SJunchao Zhang 4481d67d9f35SJunchao Zhang /*@C 4482d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4483d67d9f35SJunchao Zhang 4484d67d9f35SJunchao Zhang Not Collective 4485d67d9f35SJunchao Zhang 4486d67d9f35SJunchao Zhang Input Parameter: 4487d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4488d67d9f35SJunchao Zhang 4489d67d9f35SJunchao Zhang Output Parameter: 4490d67d9f35SJunchao Zhang . 
array - pointer to the data 4491d67d9f35SJunchao Zhang 4492d67d9f35SJunchao Zhang Level: intermediate 4493d67d9f35SJunchao Zhang 4494db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4495d67d9f35SJunchao Zhang @*/ 4496d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4497d71ae5a4SJacob Faibussowitsch { 4498d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4499d67d9f35SJunchao Zhang 4500d67d9f35SJunchao Zhang PetscFunctionBegin; 4501d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45029566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4503d67d9f35SJunchao Zhang } else { 4504d67d9f35SJunchao Zhang *array = NULL; 4505d67d9f35SJunchao Zhang } 45068f1ea47aSStefano Zampini PetscFunctionReturn(0); 45078f1ea47aSStefano Zampini } 45088f1ea47aSStefano Zampini 45098f1ea47aSStefano Zampini /*@C 451011a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45117ee59b9bSJunchao Zhang 45127ee59b9bSJunchao Zhang Not Collective 45137ee59b9bSJunchao Zhang 45147ee59b9bSJunchao Zhang Input Parameter: 451511a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45167ee59b9bSJunchao Zhang 45177ee59b9bSJunchao Zhang Output Parameters: 45187ee59b9bSJunchao Zhang + i - row map array of the matrix 45197ee59b9bSJunchao Zhang . j - column index array of the matrix 45207ee59b9bSJunchao Zhang . a - data array of the matrix 45217ee59b9bSJunchao Zhang - memtype - memory type of the arrays 45227ee59b9bSJunchao Zhang 45237ee59b9bSJunchao Zhang Notes: 45247ee59b9bSJunchao Zhang Any of the output parameters can be NULL, in which case the corresponding value is not returned. 45257ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 
45267ee59b9bSJunchao Zhang 45277ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45287ee59b9bSJunchao Zhang If the matrix is assembled, the data array 'a' is guaranteed to have the latest values of the matrix. 45297ee59b9bSJunchao Zhang 45307ee59b9bSJunchao Zhang Level: Developer 45317ee59b9bSJunchao Zhang 4532db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45337ee59b9bSJunchao Zhang @*/ 4534d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype) 4535d71ae5a4SJacob Faibussowitsch { 45367ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45377ee59b9bSJunchao Zhang 45387ee59b9bSJunchao Zhang PetscFunctionBegin; 45397ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45407ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45417ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45427ee59b9bSJunchao Zhang } else { 45437ee59b9bSJunchao Zhang if (i) *i = aij->i; 45447ee59b9bSJunchao Zhang if (j) *j = aij->j; 45457ee59b9bSJunchao Zhang if (a) *a = aij->a; 45467ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45477ee59b9bSJunchao Zhang } 45487ee59b9bSJunchao Zhang PetscFunctionReturn(0); 45497ee59b9bSJunchao Zhang } 45507ee59b9bSJunchao Zhang 45517ee59b9bSJunchao Zhang /*@C 455221e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 455321e72a00SBarry Smith 455421e72a00SBarry Smith Not Collective 455521e72a00SBarry Smith 455621e72a00SBarry Smith Input Parameter: 455711a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 455821e72a00SBarry Smith 455921e72a00SBarry Smith Output Parameter: 456021e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 456121e72a00SBarry Smith 456221e72a00SBarry Smith Level: intermediate 456321e72a00SBarry Smith 4564db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 456521e72a00SBarry Smith @*/ 4566d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4567d71ae5a4SJacob Faibussowitsch { 456821e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 456921e72a00SBarry Smith 457021e72a00SBarry Smith PetscFunctionBegin; 457121e72a00SBarry Smith *nz = aij->rmax; 457221e72a00SBarry Smith PetscFunctionReturn(0); 457321e72a00SBarry Smith } 457421e72a00SBarry Smith 4575d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4576d71ae5a4SJacob Faibussowitsch { 4577394ed5ebSJunchao Zhang MPI_Comm comm; 4578394ed5ebSJunchao Zhang PetscInt *i, *j; 4579394ed5ebSJunchao Zhang PetscInt M, N, row; 4580394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4581394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4582394ed5ebSJunchao Zhang PetscInt *Aj; 4583394ed5ebSJunchao Zhang PetscScalar *Aa; 4584cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)(mat->data); 4585cbc6b225SStefano Zampini MatType rtype; 4586394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 4587394ed5ebSJunchao Zhang 4588394ed5ebSJunchao Zhang PetscFunctionBegin; 45899566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(mat)); 45909566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 45919566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4592e8729f6fSJunchao Zhang i = coo_i; 4593e8729f6fSJunchao Zhang j = coo_j; 45949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 4595394ed5ebSJunchao Zhang for (k = 0; k < coo_n; k++) { /* 
Ignore entries with negative row or col indices */ 4596394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 4597394ed5ebSJunchao Zhang perm[k] = k; 4598394ed5ebSJunchao Zhang } 4599394ed5ebSJunchao Zhang 4600394ed5ebSJunchao Zhang /* Sort by row */ 46019566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 46029371c9d4SSatish Balay for (k = 0; k < coo_n; k++) { 46039371c9d4SSatish Balay if (i[k] >= 0) break; 46049371c9d4SSatish Balay } /* Advance k to the first row with a non-negative index */ 4605394ed5ebSJunchao Zhang nneg = k; 46069566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */ 4607394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 4608394ed5ebSJunchao Zhang jmap++; /* Inc jmap by 1 for convinience */ 4609394ed5ebSJunchao Zhang 46109566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 46119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4612394ed5ebSJunchao Zhang 4613394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 4614394ed5ebSJunchao Zhang Ai++; /* Inc by 1 for convinience */ 4615394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4616394ed5ebSJunchao Zhang while (k < coo_n) { 4617394ed5ebSJunchao Zhang row = i[k]; 4618394ed5ebSJunchao Zhang start = k; /* [start,end) indices for this row */ 4619394ed5ebSJunchao Zhang while (k < coo_n && i[k] == row) k++; 4620394ed5ebSJunchao Zhang end = k; 46219566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4622394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4623394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 
4624394ed5ebSJunchao Zhang jmap[q] = 1; /* Number of repeats of this nozero entry */ 4625394ed5ebSJunchao Zhang Ai[row] = 1; 4626394ed5ebSJunchao Zhang nnz++; 4627394ed5ebSJunchao Zhang 4628394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4629394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4630394ed5ebSJunchao Zhang q++; 4631394ed5ebSJunchao Zhang jmap[q] = 1; 4632394ed5ebSJunchao Zhang Aj[q] = j[p]; 4633394ed5ebSJunchao Zhang Ai[row]++; 4634394ed5ebSJunchao Zhang nnz++; 4635394ed5ebSJunchao Zhang } else { 4636394ed5ebSJunchao Zhang jmap[q]++; 4637394ed5ebSJunchao Zhang } 4638394ed5ebSJunchao Zhang } 4639394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4640394ed5ebSJunchao Zhang } 4641394ed5ebSJunchao Zhang 4642394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4643394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 4644394ed5ebSJunchao Zhang jmap--; /* Back to the beginning of jmap[] */ 4645394ed5ebSJunchao Zhang jmap[0] = 0; 4646394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 4647394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4648394ed5ebSJunchao Zhang PetscCount *jmap_new; 4649394ed5ebSJunchao Zhang PetscInt *Aj_new; 4650394ed5ebSJunchao Zhang 46519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 46529566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 46539566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4654394ed5ebSJunchao Zhang jmap = jmap_new; 4655394ed5ebSJunchao Zhang 46569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 46579566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 46589566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4659394ed5ebSJunchao Zhang Aj = Aj_new; 4660394ed5ebSJunchao Zhang } 4661394ed5ebSJunchao Zhang 
4662394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4663394ed5ebSJunchao Zhang PetscCount *perm_new; 4664cbc6b225SStefano Zampini 46659566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 46669566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 46679566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4668394ed5ebSJunchao Zhang perm = perm_new; 4669394ed5ebSJunchao Zhang } 4670394ed5ebSJunchao Zhang 46719566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 46729566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 46739566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4674394ed5ebSJunchao Zhang 4675394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4676394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 4677394ed5ebSJunchao Zhang /* Record COO fields */ 4678394ed5ebSJunchao Zhang seqaij->coo_n = coo_n; 4679394ed5ebSJunchao Zhang seqaij->Atot = coo_n - nneg; /* Annz is seqaij->nz, so no need to record that again */ 4680394ed5ebSJunchao Zhang seqaij->jmap = jmap; /* of length nnz+1 */ 4681394ed5ebSJunchao Zhang seqaij->perm = perm; 4682394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4683394ed5ebSJunchao Zhang } 4684394ed5ebSJunchao Zhang 4685d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4686d71ae5a4SJacob Faibussowitsch { 4687394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4688394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 4689394ed5ebSJunchao Zhang PetscCount *perm = aseq->perm, *jmap = aseq->jmap; 4690394ed5ebSJunchao Zhang PetscScalar *Aa; 
4691394ed5ebSJunchao Zhang 4692394ed5ebSJunchao Zhang PetscFunctionBegin; 46939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4694394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4695b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4696b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4697b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4698394ed5ebSJunchao Zhang } 46999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 4700394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4701394ed5ebSJunchao Zhang } 4702394ed5ebSJunchao Zhang 470334b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47045063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 470502fe1965SBarry Smith #endif 47063d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47075063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 47083d0639e7SStefano Zampini #endif 470902fe1965SBarry Smith 4710d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4711d71ae5a4SJacob Faibussowitsch { 4712273d9f13SBarry Smith Mat_SeqAIJ *b; 471338baddfdSBarry Smith PetscMPIInt size; 4714273d9f13SBarry Smith 4715273d9f13SBarry Smith PetscFunctionBegin; 47169566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 471708401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4718273d9f13SBarry Smith 47194dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 47202205254eSKarl Rupp 4721b0a32e0cSBarry Smith B->data = (void *)b; 47222205254eSKarl Rupp 47239566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 4724071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 47252205254eSKarl Rupp 
4726f4259b30SLisandro Dalcin b->row = NULL; 4727f4259b30SLisandro Dalcin b->col = NULL; 4728f4259b30SLisandro Dalcin b->icol = NULL; 4729b810aeb4SBarry Smith b->reallocs = 0; 473036db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4731f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4732416022c9SBarry Smith b->nonew = 0; 4733f4259b30SLisandro Dalcin b->diag = NULL; 4734f4259b30SLisandro Dalcin b->solve_work = NULL; 4735f4259b30SLisandro Dalcin B->spptr = NULL; 4736f4259b30SLisandro Dalcin b->saved_values = NULL; 4737f4259b30SLisandro Dalcin b->idiag = NULL; 4738f4259b30SLisandro Dalcin b->mdiag = NULL; 4739f4259b30SLisandro Dalcin b->ssor_work = NULL; 474071f1c65dSBarry Smith b->omega = 1.0; 474171f1c65dSBarry Smith b->fshift = 0.0; 474271f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4743bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4744a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 474517ab2063SBarry Smith 47469566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4747d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 47489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 47499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4750b3866ffcSBarry Smith #endif 47519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 47529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 47539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 47549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 
47559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 47569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 47579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 47589779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 47599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4760191b95cbSRichard Tran Mills #endif 476134b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 47639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 47649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 476502fe1965SBarry Smith #endif 47663d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 47683d0639e7SStefano Zampini #endif 47699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4770af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 47719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4772af8000cdSHong Zhang #endif 4773d24d4204SJose E. 
Roman #if defined(PETSC_HAVE_SCALAPACK) 47749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4775d24d4204SJose E. Roman #endif 477663c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 47779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 47789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 477963c07aadSStefano Zampini #endif 47809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 47819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 47829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 47839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 47849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ)); 47859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 47869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 47879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 47889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 47899566063dSJacob 
Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 47909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 47919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 47929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 47939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 47949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 47959566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 47969566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 47979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 47983a40ed3dSBarry Smith PetscFunctionReturn(0); 479917ab2063SBarry Smith } 480017ab2063SBarry Smith 4801b24902e0SBarry Smith /* 48023893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4803b24902e0SBarry Smith */ 4804d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4805d71ae5a4SJacob Faibussowitsch { 48062a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4807071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 480817ab2063SBarry Smith 48093a40ed3dSBarry Smith PetscFunctionBegin; 4810aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4811273d9f13SBarry Smith 4812d5f3da31SBarry Smith C->factortype = A->factortype; 4813f4259b30SLisandro Dalcin c->row = NULL; 4814f4259b30SLisandro Dalcin c->col = NULL; 4815f4259b30SLisandro Dalcin c->icol = NULL; 48166ad4291fSHong Zhang c->reallocs = 0; 481717ab2063SBarry Smith 481869272f91SPierre Jolivet C->assembled = A->assembled; 481969272f91SPierre Jolivet C->preallocated = A->preallocated; 482017ab2063SBarry Smith 482169272f91SPierre Jolivet if (A->preallocated) { 48229566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 48239566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4824eec197d1SBarry Smith 48259566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 48269566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 48279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 48289566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 482917ab2063SBarry Smith 483017ab2063SBarry Smith /* allocate the matrix space */ 4831f77e22a1SHong Zhang if (mallocmatspace) { 48329566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 48332205254eSKarl Rupp 4834f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 48352205254eSKarl Rupp 48369566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 483717ab2063SBarry Smith if (m > 0) { 48389566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4839be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 48402e5835c6SStefano Zampini const PetscScalar *aa; 48412e5835c6SStefano Zampini 48429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 48439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 48449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
4845be6bf707SBarry Smith } else { 48469566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 484717ab2063SBarry Smith } 484808480c60SBarry Smith } 4849f77e22a1SHong Zhang } 485017ab2063SBarry Smith 48516ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4852416022c9SBarry Smith c->roworiented = a->roworiented; 4853416022c9SBarry Smith c->nonew = a->nonew; 4854416022c9SBarry Smith if (a->diag) { 48559566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 48569566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 4857071fcb05SBarry Smith } else c->diag = NULL; 48582205254eSKarl Rupp 4859f4259b30SLisandro Dalcin c->solve_work = NULL; 4860f4259b30SLisandro Dalcin c->saved_values = NULL; 4861f4259b30SLisandro Dalcin c->idiag = NULL; 4862f4259b30SLisandro Dalcin c->ssor_work = NULL; 4863a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4864e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4865e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 48666ad4291fSHong Zhang 4867893ad86cSHong Zhang c->rmax = a->rmax; 4868416022c9SBarry Smith c->nz = a->nz; 48698ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4870754ec7b1SSatish Balay 48716ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 48726ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4873cd6b891eSBarry Smith if (a->compressedrow.use) { 48746ad4291fSHong Zhang i = a->compressedrow.nrows; 48759566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 48769566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 48779566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 487827ea64f8SHong Zhang } else { 487927ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 48800298fd71SBarry Smith c->compressedrow.i = 
NULL; 48810298fd71SBarry Smith c->compressedrow.rindex = NULL; 48826ad4291fSHong Zhang } 4883ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4884e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 48854846f1f5SKris Buschelman 48869566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 488769272f91SPierre Jolivet } 48889566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 48893a40ed3dSBarry Smith PetscFunctionReturn(0); 489017ab2063SBarry Smith } 489117ab2063SBarry Smith 4892d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 4893d71ae5a4SJacob Faibussowitsch { 4894b24902e0SBarry Smith PetscFunctionBegin; 48959566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 48969566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 489748a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 48989566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 48999566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 4900b24902e0SBarry Smith PetscFunctionReturn(0); 4901b24902e0SBarry Smith } 4902b24902e0SBarry Smith 4903d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4904d71ae5a4SJacob Faibussowitsch { 490552f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 490652f91c60SVaclav Hapla 490752f91c60SVaclav Hapla PetscFunctionBegin; 490852f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 490952f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 4910c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 49119566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 
49129566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 49139566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 491452f91c60SVaclav Hapla if (isbinary) { 49159566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 491652f91c60SVaclav Hapla } else if (ishdf5) { 491752f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 49189566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 491952f91c60SVaclav Hapla #else 492052f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 492152f91c60SVaclav Hapla #endif 492252f91c60SVaclav Hapla } else { 492398921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 492452f91c60SVaclav Hapla } 492552f91c60SVaclav Hapla PetscFunctionReturn(0); 492652f91c60SVaclav Hapla } 492752f91c60SVaclav Hapla 4928d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 4929d71ae5a4SJacob Faibussowitsch { 49303ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 49313ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 4932fbdbba38SShri Abhyankar 4933fbdbba38SShri Abhyankar PetscFunctionBegin; 49349566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 4935bbead8a2SBarry Smith 49363ea6fe3dSLisandro Dalcin /* read in matrix header */ 49379566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 493808401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 49399371c9d4SSatish Balay M = header[1]; 
49409371c9d4SSatish Balay N = header[2]; 49419371c9d4SSatish Balay nz = header[3]; 494208401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 494308401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 494408401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 4945fbdbba38SShri Abhyankar 49463ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 49479566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 49483ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 49493ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 49503ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 49513ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 49523ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 49539566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 49549566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 49553ea6fe3dSLisandro Dalcin 49563ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 49579566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 4958aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 49593ea6fe3dSLisandro Dalcin 4960fbdbba38SShri Abhyankar /* read in row lengths */ 49619566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 49629566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 
49633ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 49649371c9d4SSatish Balay sum = 0; 49659371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 496608401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 49673ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 49689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 49699566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 4970aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 49713ea6fe3dSLisandro Dalcin /* store row lengths */ 49729566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 49739566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 4974fbdbba38SShri Abhyankar 49753ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 49769371c9d4SSatish Balay a->i[0] = 0; 49779371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 49783ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 49799566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 49803ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 49819566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 4982fbdbba38SShri Abhyankar 49839566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 49849566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 4985fbdbba38SShri Abhyankar PetscFunctionReturn(0); 4986fbdbba38SShri Abhyankar } 4987fbdbba38SShri Abhyankar 4988d71ae5a4SJacob Faibussowitsch PetscErrorCode 
MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 4989d71ae5a4SJacob Faibussowitsch { 49907264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 4991fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4992eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4993eeffb40dSHong Zhang PetscInt k; 4994eeffb40dSHong Zhang #endif 49957264ac53SSatish Balay 49963a40ed3dSBarry Smith PetscFunctionBegin; 4997bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 4998d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 4999ca44d042SBarry Smith *flg = PETSC_FALSE; 5000ca44d042SBarry Smith PetscFunctionReturn(0); 5001bcd2baecSBarry Smith } 50027264ac53SSatish Balay 50037264ac53SSatish Balay /* if the a->i are the same */ 50049566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 5005abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 50067264ac53SSatish Balay 50077264ac53SSatish Balay /* if a->j are the same */ 50089566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 5009abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 5010bcd2baecSBarry Smith 50119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5013bcd2baecSBarry Smith /* if a->a are the same */ 5014eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5015eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5016fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5017eeffb40dSHong Zhang *flg = PETSC_FALSE; 50183a40ed3dSBarry Smith PetscFunctionReturn(0); 5019eeffb40dSHong Zhang } 5020eeffb40dSHong Zhang } 5021eeffb40dSHong Zhang #else 50229566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5023eeffb40dSHong Zhang #endif 50249566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 50259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 5026eeffb40dSHong Zhang PetscFunctionReturn(0); 50277264ac53SSatish Balay } 502836db0b34SBarry Smith 502905869f15SSatish Balay /*@ 503011a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 503136db0b34SBarry Smith provided by the user. 503236db0b34SBarry Smith 5033d083f849SBarry Smith Collective 503436db0b34SBarry Smith 503536db0b34SBarry Smith Input Parameters: 503636db0b34SBarry Smith + comm - must be an MPI communicator of size 1 503736db0b34SBarry Smith . m - number of rows 503836db0b34SBarry Smith . n - number of columns 5039483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 504036db0b34SBarry Smith . j - column indices 504136db0b34SBarry Smith - a - matrix values 504236db0b34SBarry Smith 504336db0b34SBarry Smith Output Parameter: 504436db0b34SBarry Smith . mat - the matrix 504536db0b34SBarry Smith 504636db0b34SBarry Smith Level: intermediate 504736db0b34SBarry Smith 504836db0b34SBarry Smith Notes: 50490551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 5050292fb18eSBarry Smith once the matrix is destroyed and not before 505136db0b34SBarry Smith 505236db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 505336db0b34SBarry Smith 5054bfeeae90SHong Zhang The i and j indices are 0 based 505536db0b34SBarry Smith 5056a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5057a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 50588eef79e4SBarry Smith as shown 5059a4552177SSatish Balay 50608eef79e4SBarry Smith $ 1 0 0 50618eef79e4SBarry Smith $ 2 0 3 50628eef79e4SBarry Smith $ 4 5 6 50638eef79e4SBarry Smith $ 50648eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 50658eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 50668eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 5067a4552177SSatish Balay 5068db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 506936db0b34SBarry Smith @*/ 5070d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5071d71ae5a4SJacob Faibussowitsch { 5072cbcfb4deSHong Zhang PetscInt ii; 507336db0b34SBarry Smith Mat_SeqAIJ *aij; 5074cbcfb4deSHong Zhang PetscInt jj; 507536db0b34SBarry Smith 507636db0b34SBarry Smith PetscFunctionBegin; 5077aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 50789566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 50799566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 50809566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 50819566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 50829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5083ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 50849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 50859566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5086ab93d7beSBarry Smith 508736db0b34SBarry Smith aij->i = i; 508836db0b34SBarry Smith aij->j = j; 508936db0b34SBarry Smith aij->a = a; 509036db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 
509136db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5092e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5093e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 509436db0b34SBarry Smith 5095cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 509636db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 509776bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5098aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 50999985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 510008401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 510108401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 51029985e31cSBarry Smith } 510336db0b34SBarry Smith } 510476bd3646SJed Brown } 510576bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 510636db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 510708401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5108aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 510936db0b34SBarry Smith } 511076bd3646SJed Brown } 511136db0b34SBarry Smith 51129566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, 
MAT_FINAL_ASSEMBLY)); 51139566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 511436db0b34SBarry Smith PetscFunctionReturn(0); 511536db0b34SBarry Smith } 5116cbc6b225SStefano Zampini 5117f62e3866SBarry Smith /*@ 511811a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 51198a0b0e6bSVictor Minden provided by the user. 51208a0b0e6bSVictor Minden 5121d083f849SBarry Smith Collective 51228a0b0e6bSVictor Minden 51238a0b0e6bSVictor Minden Input Parameters: 51248a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 51258a0b0e6bSVictor Minden . m - number of rows 51268a0b0e6bSVictor Minden . n - number of columns 51278a0b0e6bSVictor Minden . i - row indices 51288a0b0e6bSVictor Minden . j - column indices 51291230e6d1SVictor Minden . a - matrix values 51301230e6d1SVictor Minden . nz - number of nonzeros 513111a5261eSBarry Smith - idx - if the i and j indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 51328a0b0e6bSVictor Minden 51338a0b0e6bSVictor Minden Output Parameter: 51348a0b0e6bSVictor Minden . 
mat - the matrix 51358a0b0e6bSVictor Minden 51368a0b0e6bSVictor Minden Level: intermediate 51378a0b0e6bSVictor Minden 5138f62e3866SBarry Smith Example: 5139f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 51409e99939fSJunchao Zhang .vb 51418a0b0e6bSVictor Minden 1 0 0 51428a0b0e6bSVictor Minden 2 0 3 51438a0b0e6bSVictor Minden 4 5 6 51448a0b0e6bSVictor Minden 51458a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 51468a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 51478a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 51489e99939fSJunchao Zhang .ve 51498a0b0e6bSVictor Minden 5150db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()` 51518a0b0e6bSVictor Minden @*/ 5152d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5153d71ae5a4SJacob Faibussowitsch { 5154d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 51558a0b0e6bSVictor Minden 51568a0b0e6bSVictor Minden PetscFunctionBegin; 51579566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5158ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 51599566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51609566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51619566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 51631230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 51641230e6d1SVictor Minden if (idx) { 51651230e6d1SVictor Minden row = i[ii] - 1; 51661230e6d1SVictor Minden col = j[ii] - 1; 51671230e6d1SVictor Minden } else { 51681230e6d1SVictor Minden row = i[ii]; 51691230e6d1SVictor Minden col = j[ii]; 51708a0b0e6bSVictor Minden } 51719566063dSJacob 
Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 51728a0b0e6bSVictor Minden } 51739566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 51749566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 51759566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 51768a0b0e6bSVictor Minden PetscFunctionReturn(0); 51778a0b0e6bSVictor Minden } 517836db0b34SBarry Smith 5179d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5180d71ae5a4SJacob Faibussowitsch { 5181acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5182acf2f550SJed Brown 5183acf2f550SJed Brown PetscFunctionBegin; 5184acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5185acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 51862205254eSKarl Rupp 51879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 5188acf2f550SJed Brown PetscFunctionReturn(0); 5189acf2f550SJed Brown } 5190acf2f550SJed Brown 5191d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5192d71ae5a4SJacob Faibussowitsch { 51939c8f2541SHong Zhang PetscFunctionBegin; 51949566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 51959c8f2541SHong Zhang PetscFunctionReturn(0); 51969c8f2541SHong Zhang } 51979c8f2541SHong Zhang 519881824310SBarry Smith /* 519953dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 520053dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 520153dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 520253dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 
520353dd7562SDmitry Karpeev */ 5204d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5205d71ae5a4SJacob Faibussowitsch { 520653dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 520753dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 520853dd7562SDmitry Karpeev PetscBool seqaij; 520953dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 521053dd7562SDmitry Karpeev PetscScalar v; 521153dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 521253dd7562SDmitry Karpeev 521353dd7562SDmitry Karpeev PetscFunctionBegin; 521453dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 521553dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */ 52169566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 521728b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 521853dd7562SDmitry Karpeev if (rowemb) { 52199566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 522008401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 522153dd7562SDmitry Karpeev } else { 522208401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 522353dd7562SDmitry Karpeev } 522453dd7562SDmitry Karpeev if (colemb) { 52259566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 522608401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 522753dd7562SDmitry Karpeev } else { 522808401ef6SPierre Jolivet 
PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 522953dd7562SDmitry Karpeev } 523053dd7562SDmitry Karpeev 523153dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ *)(B->data); 523253dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 52339566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5234ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 52359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 52369566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 523753dd7562SDmitry Karpeev } 523848a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 523953dd7562SDmitry Karpeev count = 0; 524053dd7562SDmitry Karpeev rowindices = NULL; 524153dd7562SDmitry Karpeev colindices = NULL; 524248a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 524348a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 524453dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 524553dd7562SDmitry Karpeev PetscInt row; 524653dd7562SDmitry Karpeev row = i; 524753dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 524853dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 524953dd7562SDmitry Karpeev PetscInt col; 525053dd7562SDmitry Karpeev col = Baij->j[count]; 525153dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 525253dd7562SDmitry Karpeev v = Baij->a[count]; 52539566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 525453dd7562SDmitry Karpeev ++count; 525553dd7562SDmitry Karpeev } 525653dd7562SDmitry Karpeev } 525753dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 525853dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 525953dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 526053dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 526153dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 526253dd7562SDmitry Karpeev PetscFunctionReturn(0); 526353dd7562SDmitry Karpeev } 526453dd7562SDmitry Karpeev 5265*dec0b466SHong Zhang PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A) 5266*dec0b466SHong Zhang { 5267*dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5268*dec0b466SHong Zhang MatScalar *aa = a->a; 5269*dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5270*dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5271*dec0b466SHong Zhang 5272*dec0b466SHong Zhang PetscFunctionBegin; 5273*dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5274*dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5275*dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5276*dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5277*dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 5278*dec0b466SHong Zhang if (aa[k] == 0 && aj[k] != i - 1) fshift++; 5279*dec0b466SHong Zhang else { 5280*dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5281*dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5282*dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5283*dec0b466SHong Zhang } 5284*dec0b466SHong Zhang } 5285*dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5286*dec0b466SHong Zhang fshift_prev = fshift; 5287*dec0b466SHong Zhang /* reset ilen and imax for each row */ 5288*dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5289*dec0b466SHong Zhang a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) 
> 0); 5290*dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5291*dec0b466SHong Zhang } 5292*dec0b466SHong Zhang if (m) { 5293*dec0b466SHong Zhang ai[m] -= fshift; 5294*dec0b466SHong Zhang a->nz = ai[m]; 5295*dec0b466SHong Zhang } 5296*dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5297*dec0b466SHong Zhang A->nonzerostate -= fshift; 5298*dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5299*dec0b466SHong Zhang a->rmax = rmax; 5300*dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5301*dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5302*dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5303*dec0b466SHong Zhang PetscFunctionReturn(0); 5304*dec0b466SHong Zhang } 5305*dec0b466SHong Zhang 53064099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 53074099cc6bSBarry Smith 53084099cc6bSBarry Smith /*@C 530911a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 53104099cc6bSBarry Smith 531111a5261eSBarry Smith Collective on mat 53124099cc6bSBarry Smith 53134099cc6bSBarry Smith Input Parameters: 53144099cc6bSBarry Smith + mat - the matrix object 53154099cc6bSBarry Smith - matype - matrix type 53164099cc6bSBarry Smith 53174099cc6bSBarry Smith Options Database Key: 53184099cc6bSBarry Smith . 
-mat_seqai_type <method> - for example seqaijcrl 53194099cc6bSBarry Smith 53204099cc6bSBarry Smith Level: intermediate 53214099cc6bSBarry Smith 5322db781477SPatrick Sanan .seealso: `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat` 53234099cc6bSBarry Smith @*/ 5324d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5325d71ae5a4SJacob Faibussowitsch { 53264099cc6bSBarry Smith PetscBool sametype; 53275f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 53284099cc6bSBarry Smith 53294099cc6bSBarry Smith PetscFunctionBegin; 53304099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 53319566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 53324099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 53334099cc6bSBarry Smith 53349566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 53355f80ce2aSJacob Faibussowitsch PetscCheck(r, PETSC_COMM_SELF, PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 53369566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 53374099cc6bSBarry Smith PetscFunctionReturn(0); 53384099cc6bSBarry Smith } 53394099cc6bSBarry Smith 53404099cc6bSBarry Smith /*@C 534111a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 53424099cc6bSBarry Smith 53434099cc6bSBarry Smith Not Collective 53444099cc6bSBarry Smith 53454099cc6bSBarry Smith Input Parameters: 534611a5261eSBarry Smith + name - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 53474099cc6bSBarry Smith - function - routine to convert to subtype 53484099cc6bSBarry Smith 53494099cc6bSBarry Smith Notes: 535011a5261eSBarry Smith `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 
53514099cc6bSBarry Smith 53524099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 53534099cc6bSBarry Smith $ -mat_seqaij_type my_mat 53544099cc6bSBarry Smith 53554099cc6bSBarry Smith Level: advanced 53564099cc6bSBarry Smith 5357db781477SPatrick Sanan .seealso: `MatSeqAIJRegisterAll()` 53584099cc6bSBarry Smith @*/ 5359d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5360d71ae5a4SJacob Faibussowitsch { 53614099cc6bSBarry Smith PetscFunctionBegin; 53629566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 53639566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 53644099cc6bSBarry Smith PetscFunctionReturn(0); 53654099cc6bSBarry Smith } 53664099cc6bSBarry Smith 53674099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 53684099cc6bSBarry Smith 53694099cc6bSBarry Smith /*@C 537011a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 53714099cc6bSBarry Smith 53724099cc6bSBarry Smith Not Collective 53734099cc6bSBarry Smith 53744099cc6bSBarry Smith Level: advanced 53754099cc6bSBarry Smith 5376db781477SPatrick Sanan .seealso: `MatRegisterAll()`, `MatSeqAIJRegister()` 53774099cc6bSBarry Smith @*/ 5378d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5379d71ae5a4SJacob Faibussowitsch { 53804099cc6bSBarry Smith PetscFunctionBegin; 53814099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 53824099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 53834099cc6bSBarry Smith 53849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 53859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 53869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, 
MatConvert_SeqAIJ_SeqAIJSELL)); 53879779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 53889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5389485f9817SRichard Tran Mills #endif 53905063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 53919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 53925063d097SStefano Zampini #endif 53935063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 53949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 53955063d097SStefano Zampini #endif 53964099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 53979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 53984099cc6bSBarry Smith #endif 53994099cc6bSBarry Smith PetscFunctionReturn(0); 54004099cc6bSBarry Smith } 540153dd7562SDmitry Karpeev 540253dd7562SDmitry Karpeev /* 540381824310SBarry Smith Special version for direct calls from Fortran 540481824310SBarry Smith */ 5405af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 540681824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 540781824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 540881824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 540981824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 541081824310SBarry Smith #endif 541181824310SBarry Smith 541281824310SBarry Smith /* Change these macros so can be used in void function */ 541398921bdaSJacob Faibussowitsch 541498921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 54159566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 54169566063dSJacob Faibussowitsch #undef PetscCall 54179371c9d4SSatish Balay #define PetscCall(...) 
\ 54189371c9d4SSatish Balay do { \ 54195f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 542098921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 542198921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 542298921bdaSJacob Faibussowitsch return; \ 542398921bdaSJacob Faibussowitsch } \ 542498921bdaSJacob Faibussowitsch } while (0) 542598921bdaSJacob Faibussowitsch 542698921bdaSJacob Faibussowitsch #undef SETERRQ 54279371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 54289371c9d4SSatish Balay do { \ 542998921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 543098921bdaSJacob Faibussowitsch return; \ 543198921bdaSJacob Faibussowitsch } while (0) 543281824310SBarry Smith 5433d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5434d71ae5a4SJacob Faibussowitsch { 543581824310SBarry Smith Mat A = *AA; 543681824310SBarry Smith PetscInt m = *mm, n = *nn; 543781824310SBarry Smith InsertMode is = *isis; 543881824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 543981824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 544081824310SBarry Smith PetscInt *imax, *ai, *ailen; 544181824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 544254f21887SBarry Smith MatScalar *ap, value, *aa; 5443ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5444ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 544581824310SBarry Smith 544681824310SBarry Smith PetscFunctionBegin; 54474994cf47SJed Brown MatCheckPreallocated(A, 1); 544881824310SBarry Smith imax = a->imax; 544981824310SBarry Smith ai = a->i; 545081824310SBarry Smith 
ailen = a->ilen; 545181824310SBarry Smith aj = a->j; 545281824310SBarry Smith aa = a->a; 545381824310SBarry Smith 545481824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 545581824310SBarry Smith row = im[k]; 545681824310SBarry Smith if (row < 0) continue; 54575f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 54589371c9d4SSatish Balay rp = aj + ai[row]; 54599371c9d4SSatish Balay ap = aa + ai[row]; 54609371c9d4SSatish Balay rmax = imax[row]; 54619371c9d4SSatish Balay nrow = ailen[row]; 546281824310SBarry Smith low = 0; 546381824310SBarry Smith high = nrow; 546481824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 546581824310SBarry Smith if (in[l] < 0) continue; 54665f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 546781824310SBarry Smith col = in[l]; 54682205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 54692205254eSKarl Rupp else value = v[k + l * m]; 54702205254eSKarl Rupp 547181824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 547281824310SBarry Smith 54732205254eSKarl Rupp if (col <= lastcol) low = 0; 54742205254eSKarl Rupp else high = nrow; 547581824310SBarry Smith lastcol = col; 547681824310SBarry Smith while (high - low > 5) { 547781824310SBarry Smith t = (low + high) / 2; 547881824310SBarry Smith if (rp[t] > col) high = t; 547981824310SBarry Smith else low = t; 548081824310SBarry Smith } 548181824310SBarry Smith for (i = low; i < high; i++) { 548281824310SBarry Smith if (rp[i] > col) break; 548381824310SBarry Smith if (rp[i] == col) { 548481824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 548581824310SBarry Smith else ap[i] = value; 548681824310SBarry Smith goto noinsert; 548781824310SBarry Smith } 548881824310SBarry Smith } 548981824310SBarry Smith if (value == 0.0 && 
ignorezeroentries) goto noinsert; 549081824310SBarry Smith if (nonew == 1) goto noinsert; 54915f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5492fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 54939371c9d4SSatish Balay N = nrow++ - 1; 54949371c9d4SSatish Balay a->nz++; 54959371c9d4SSatish Balay high++; 549681824310SBarry Smith /* shift up all the later entries in this row */ 549781824310SBarry Smith for (ii = N; ii >= i; ii--) { 549881824310SBarry Smith rp[ii + 1] = rp[ii]; 549981824310SBarry Smith ap[ii + 1] = ap[ii]; 550081824310SBarry Smith } 550181824310SBarry Smith rp[i] = col; 550281824310SBarry Smith ap[i] = value; 5503e56f5c9eSBarry Smith A->nonzerostate++; 550481824310SBarry Smith noinsert:; 550581824310SBarry Smith low = i + 1; 550681824310SBarry Smith } 550781824310SBarry Smith ailen[row] = nrow; 550881824310SBarry Smith } 550981824310SBarry Smith PetscFunctionReturnVoid(); 551081824310SBarry Smith } 551198921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 551298921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 551398921bdaSJacob Faibussowitsch * original definitions */ 55149566063dSJacob Faibussowitsch #undef PetscCall 551598921bdaSJacob Faibussowitsch #undef SETERRQ 5516