1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 20d71ae5a4SJacob Faibussowitsch { 214099cc6bSBarry Smith PetscBool flg; 224099cc6bSBarry Smith char type[256]; 234099cc6bSBarry Smith 244099cc6bSBarry Smith PetscFunctionBegin; 25d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 279566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 28d0609cedSBarry Smith PetscOptionsEnd(); 293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 304099cc6bSBarry Smith } 314099cc6bSBarry Smith 32d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 33d71ae5a4SJacob Faibussowitsch { 340716a85fSBarry Smith PetscInt i, m, n; 350716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 360716a85fSBarry Smith 370716a85fSBarry Smith PetscFunctionBegin; 389566063dSJacob Faibussowitsch 
PetscCall(MatGetSize(A, &m, &n)); 399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 400716a85fSBarry Smith if (type == NORM_2) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 420716a85fSBarry Smith } else if (type == NORM_1) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_INFINITY) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 50857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 53a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 54857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 560716a85fSBarry Smith } 573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 580716a85fSBarry Smith } 590716a85fSBarry Smith 60d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 61d71ae5a4SJacob Faibussowitsch { 623a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 633a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 643a062f41SBarry Smith const PetscInt 
*jj = a->j, *ii = a->i; 653a062f41SBarry Smith PetscInt *rows; 663a062f41SBarry Smith 673a062f41SBarry Smith PetscFunctionBegin; 683a062f41SBarry Smith for (i = 0; i < m; i++) { 69ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i = 0; i < m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 799566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 84d71ae5a4SJacob Faibussowitsch { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 86fff043a9SJunchao Zhang const MatScalar *aa; 876ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith 916ce1633cSBarry Smith PetscFunctionBegin; 929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 939566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i = 0; i < m; i++) { 96ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 976ce1633cSBarry Smith } 989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 996ce1633cSBarry Smith cnt = 0; 1006ce1633cSBarry Smith for (i = 0; i < m; i++) { 
101ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1026ce1633cSBarry Smith } 103f1f41ecbSJed Brown *nrows = cnt; 104f1f41ecbSJed Brown *zrows = rows; 1059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107f1f41ecbSJed Brown } 108f1f41ecbSJed Brown 109d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 110d71ae5a4SJacob Faibussowitsch { 111f1f41ecbSJed Brown PetscInt nrows, *rows; 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscFunctionBegin; 1140298fd71SBarry Smith *zrows = NULL; 1159566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1169566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1186ce1633cSBarry Smith } 1196ce1633cSBarry Smith 120d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 121d71ae5a4SJacob Faibussowitsch { 122b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 123b3a44c85SBarry Smith const MatScalar *aa; 124b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 125b3a44c85SBarry Smith const PetscInt *ii; 126b3a44c85SBarry Smith PetscInt n, i, j, *rows; 127b3a44c85SBarry Smith 128b3a44c85SBarry Smith PetscFunctionBegin; 1299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 130f4259b30SLisandro Dalcin *keptrows = NULL; 131b3a44c85SBarry Smith ii = a->i; 132b3a44c85SBarry Smith for (i = 0; i < m; i++) { 133b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 134b3a44c85SBarry Smith if (!n) { 135b3a44c85SBarry Smith cnt++; 136b3a44c85SBarry Smith goto ok1; 137b3a44c85SBarry Smith } 1382e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 139b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 
140b3a44c85SBarry Smith } 141b3a44c85SBarry Smith cnt++; 142b3a44c85SBarry Smith ok1:; 143b3a44c85SBarry Smith } 1442e5835c6SStefano Zampini if (!cnt) { 1459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1472e5835c6SStefano Zampini } 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 149b3a44c85SBarry Smith cnt = 0; 150b3a44c85SBarry Smith for (i = 0; i < m; i++) { 151b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 152b3a44c85SBarry Smith if (!n) continue; 1532e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 154b3a44c85SBarry Smith if (aa[j] != 0.0) { 155b3a44c85SBarry Smith rows[cnt++] = i; 156b3a44c85SBarry Smith break; 157b3a44c85SBarry Smith } 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 1609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1619566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith 165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 166d71ae5a4SJacob Faibussowitsch { 16779299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172ace3abfcSBarry Smith PetscBool missing; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 1769566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 17709f38230SBarry Smith if (!missing) { 17879299369SBarry Smith diag = aij->diag; 1799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 1809566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJGetArray(Y, &aa)); 18179299369SBarry Smith if (is == INSERT_VALUES) { 182ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18379299369SBarry Smith } else { 184ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18579299369SBarry Smith } 1869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18979299369SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 19109f38230SBarry Smith } 1929566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19409f38230SBarry Smith } 19579299369SBarry Smith 196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 197d71ae5a4SJacob Faibussowitsch { 198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19997f1f81fSBarry Smith PetscInt i, ishift; 20017ab2063SBarry Smith 2013a40ed3dSBarry Smith PetscFunctionBegin; 202f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2033ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 204bfeeae90SHong Zhang ishift = 0; 205b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2069566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 207bfeeae90SHong Zhang } else if (oshift == 1) { 2081a83f524SJed Brown PetscInt *tia; 209d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2103b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 2121a83f524SJed Brown for (i = 0; i < 
A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2131a83f524SJed Brown *ia = tia; 214ecc77c7aSBarry Smith if (ja) { 2151a83f524SJed Brown PetscInt *tja; 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob Faibussowitsch if (!ia) 
PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2813ba16761SJacob 
Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] 
- a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 
348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 
381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " 
max %" PetscInt_FMT, row, A->rmap->n - 1); 418720833daSHong Zhang rp = aj + ai[row]; 419876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 453c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, 
PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e56f5c9eSBarry Smith A->nonzerostate++; 472e44c0bd4SBarry Smith noinsert:; 47317ab2063SBarry Smith } 47417ab2063SBarry Smith ailen[row] = nrow; 47517ab2063SBarry Smith } 4769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47817ab2063SBarry Smith } 47917ab2063SBarry Smith 480d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 481d71ae5a4SJacob Faibussowitsch { 48219b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48319b08ed1SBarry Smith PetscInt *rp, k, row; 48419b08ed1SBarry Smith PetscInt *ai = a->i; 48519b08ed1SBarry Smith PetscInt *aj = a->j; 486fff043a9SJunchao Zhang MatScalar *aa, *ap; 48719b08ed1SBarry Smith 48819b08ed1SBarry Smith PetscFunctionBegin; 
48928b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 49008401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 491fff043a9SJunchao Zhang 4929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49319b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49419b08ed1SBarry Smith row = im[k]; 49519b08ed1SBarry Smith rp = aj + ai[row]; 49619b08ed1SBarry Smith ap = aa + ai[row]; 49719b08ed1SBarry Smith 4989566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49919b08ed1SBarry Smith if (!A->structure_only) { 50019b08ed1SBarry Smith if (v) { 5019566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 50219b08ed1SBarry Smith v += n; 50319b08ed1SBarry Smith } else { 5049566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith a->ilen[row] = n; 50819b08ed1SBarry Smith a->imax[row] = n; 50919b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 51019b08ed1SBarry Smith a->nz += n; 51119b08ed1SBarry Smith } 5129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51419b08ed1SBarry Smith } 51519b08ed1SBarry Smith 51619b08ed1SBarry Smith /*@ 51719b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 
51819b08ed1SBarry Smith 51919b08ed1SBarry Smith Input Parameters: 52011a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52119b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52219b08ed1SBarry Smith 52319b08ed1SBarry Smith Level: advanced 52419b08ed1SBarry Smith 52519b08ed1SBarry Smith Notes: 52619b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52711a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52819b08ed1SBarry Smith as always with multiple matrix assemblies. 52919b08ed1SBarry Smith 530db781477SPatrick Sanan .seealso: `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53119b08ed1SBarry Smith @*/ 53219b08ed1SBarry Smith 533d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 534d71ae5a4SJacob Faibussowitsch { 53519b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53619b08ed1SBarry Smith 53719b08ed1SBarry Smith PetscFunctionBegin; 5389566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5399566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 54019b08ed1SBarry Smith a->maxnz = nztotal; 5414dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 54219b08ed1SBarry Smith if (!a->ilen) { 5439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54419b08ed1SBarry Smith } else { 5459566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54619b08ed1SBarry Smith } 54719b08ed1SBarry Smith 54819b08ed1SBarry Smith /* allocate the matrix space */ 54919b08ed1SBarry Smith if (A->structure_only) { 5509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 55219b08ed1SBarry Smith 
} else { 5539566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 55419b08ed1SBarry Smith } 55519b08ed1SBarry Smith a->i[0] = 0; 55619b08ed1SBarry Smith if (A->structure_only) { 55719b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55819b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55919b08ed1SBarry Smith } else { 56019b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 56119b08ed1SBarry Smith a->free_a = PETSC_TRUE; 56219b08ed1SBarry Smith } 56319b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 56419b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 56519b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56719b08ed1SBarry Smith } 56819b08ed1SBarry Smith 569d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 570d71ae5a4SJacob Faibussowitsch { 571071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 572071fcb05SBarry Smith PetscInt *rp, k, row; 573071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 574071fcb05SBarry Smith PetscInt *aj = a->j; 575fff043a9SJunchao Zhang MatScalar *aa, *ap; 576071fcb05SBarry Smith 577071fcb05SBarry Smith PetscFunctionBegin; 5789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 579071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 580071fcb05SBarry Smith row = im[k]; 5816bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 582071fcb05SBarry Smith rp = aj + ai[row]; 583071fcb05SBarry Smith ap = aa + ai[row]; 58448a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 585071fcb05SBarry Smith if (!A->structure_only) { 586071fcb05SBarry Smith 
if (v) { 5879566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 588071fcb05SBarry Smith v += n; 589071fcb05SBarry Smith } else { 5909566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 591071fcb05SBarry Smith } 592071fcb05SBarry Smith } 593071fcb05SBarry Smith ailen[row] = n; 594071fcb05SBarry Smith a->nz += n; 595071fcb05SBarry Smith } 5969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 598071fcb05SBarry Smith } 599071fcb05SBarry Smith 600d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 601d71ae5a4SJacob Faibussowitsch { 6027eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 60397f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 60497f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 6054e208921SJed Brown const MatScalar *ap, *aa; 6067eb43aa7SLois Curfman McInnes 6073a40ed3dSBarry Smith PetscFunctionBegin; 6084e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6097eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6107eb43aa7SLois Curfman McInnes row = im[k]; 6119371c9d4SSatish Balay if (row < 0) { 6129371c9d4SSatish Balay v += n; 6139371c9d4SSatish Balay continue; 6149371c9d4SSatish Balay } /* negative row */ 61554c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6169371c9d4SSatish Balay rp = aj + ai[row]; 6179371c9d4SSatish Balay ap = aa + ai[row]; 6187eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6197eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6209371c9d4SSatish Balay if (in[l] < 0) { 6219371c9d4SSatish Balay v++; 6229371c9d4SSatish Balay continue; 
6239371c9d4SSatish Balay } /* negative column */ 62454c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 625bfeeae90SHong Zhang col = in[l]; 6269371c9d4SSatish Balay high = nrow; 6279371c9d4SSatish Balay low = 0; /* assume unsorted */ 6287eb43aa7SLois Curfman McInnes while (high - low > 5) { 6297eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6307eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6317eb43aa7SLois Curfman McInnes else low = t; 6327eb43aa7SLois Curfman McInnes } 6337eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6347eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6357eb43aa7SLois Curfman McInnes if (rp[i] == col) { 636b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6377eb43aa7SLois Curfman McInnes goto finished; 6387eb43aa7SLois Curfman McInnes } 6397eb43aa7SLois Curfman McInnes } 64097e567efSBarry Smith *v++ = 0.0; 6417eb43aa7SLois Curfman McInnes finished:; 6427eb43aa7SLois Curfman McInnes } 6437eb43aa7SLois Curfman McInnes } 6444e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6467eb43aa7SLois Curfman McInnes } 6477eb43aa7SLois Curfman McInnes 648d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 649d71ae5a4SJacob Faibussowitsch { 6503ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 651c898d852SStefano Zampini const PetscScalar *av; 6523ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6533ea6fe3dSLisandro Dalcin PetscInt *rowlens; 65417ab2063SBarry Smith 6553a40ed3dSBarry Smith PetscFunctionBegin; 6569566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6572205254eSKarl Rupp 6583ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6593ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6603ea6fe3dSLisandro Dalcin m = mat->rmap->n; 
6613ea6fe3dSLisandro Dalcin nz = A->nz; 662416022c9SBarry Smith 6633ea6fe3dSLisandro Dalcin /* write matrix header */ 6643ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6659371c9d4SSatish Balay header[1] = M; 6669371c9d4SSatish Balay header[2] = N; 6679371c9d4SSatish Balay header[3] = nz; 6689566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 669416022c9SBarry Smith 6703ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6723ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6739566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6749566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6753ea6fe3dSLisandro Dalcin /* store column indices */ 6769566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 677416022c9SBarry Smith /* store nonzero values */ 6789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6799566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 681b37d52dbSMark F. 
Adams 6823ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6839566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 68517ab2063SBarry Smith } 686416022c9SBarry Smith 687d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 688d71ae5a4SJacob Faibussowitsch { 6897dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6907dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6917dc0baabSHong Zhang 6927dc0baabSHong Zhang PetscFunctionBegin; 6939566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6947dc0baabSHong Zhang for (i = 0; i < m; i++) { 6959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 69648a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6987dc0baabSHong Zhang } 6999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 7003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7017dc0baabSHong Zhang } 7027dc0baabSHong Zhang 70309573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 704cd155464SBarry Smith 705d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 706d71ae5a4SJacob Faibussowitsch { 707416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 708c898d852SStefano Zampini const PetscScalar *av; 70960e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 710e060cb09SBarry Smith const char *name; 711f3ef73ceSBarry Smith PetscViewerFormat format; 71217ab2063SBarry Smith 7133a40ed3dSBarry Smith PetscFunctionBegin; 7147dc0baabSHong Zhang if (A->structure_only) { 7159566063dSJacob Faibussowitsch 
extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer);

/*
  MatView_SeqAIJ_ASCII - Prints a SeqAIJ matrix to an ASCII viewer in the viewer's current format.

  Behavior by format:
    structure-only matrix              - delegates to MatView_SeqAIJ_ASCII_structonly(), whatever the format
    PETSC_VIEWER_ASCII_FACTOR_INFO,
    PETSC_VIEWER_ASCII_INFO,
    PETSC_VIEWER_ASCII_INFO_DETAIL     - prints nothing
    PETSC_VIEWER_ASCII_MATLAB          - 1-based (row, column, value) triples plus a spconvert() call
    PETSC_VIEWER_ASCII_COMMON          - one line per row, entries that compare equal to zero are omitted
    PETSC_VIEWER_ASCII_SYMMODU         - entries with column >= row: 1-based row pointers, then column indices, then values
    PETSC_VIEWER_ASCII_DENSE           - every column of every row, missing entries printed as zero
    PETSC_VIEWER_ASCII_MATRIXMARKET    - MatrixMarket coordinate header followed by 1-based triples
    anything else                      - one line per row of "(column, value)" pairs; factored matrices
                                         (A->factortype set) are walked through a->i and a->diag

  Every printing branch disables tabbing on the viewer first and re-enables it when done.
  The viewer is flushed before returning.
*/
PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer)
{
  Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
  const PetscScalar *av;
  PetscInt           i, j, m = A->rmap->n;
  const char        *name;
  PetscViewerFormat  format;

  PetscFunctionBegin;
  if (A->structure_only) {
    PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer));
    PetscFunctionReturn(PETSC_SUCCESS);
  }

  PetscCall(PetscViewerGetFormat(viewer, &format));
  if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS);

  /* trigger copy to CPU if needed */
  /* av itself is not used below; the values are read through a->a */
  PetscCall(MatSeqAIJGetArrayRead(A, &av));
  PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
  if (format == PETSC_VIEWER_ASCII_MATLAB) {
    PetscInt nofinalvalue = 0;
    /* an extra entry is needed when the last row is empty or the last stored entry is not in the last column */
    if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) {
      /* Need a dummy value to ensure the dimension of the matrix. */
      nofinalvalue = 1;
    }
    PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
    PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n));
    PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz));
    /* complex builds print four columns per entry (row, column, real, imaginary); real builds print three */
#if defined(PETSC_USE_COMPLEX)
    PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue));
#else
    PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue));
#endif
    PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n"));

    /* row and column indices are shifted to 1-based */
    for (i = 0; i < m; i++) {
      for (j = a->i[i]; j < a->i[i + 1]; j++) {
#if defined(PETSC_USE_COMPLEX)
        PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
#else
        PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j]));
#endif
      }
    }
    if (nofinalvalue) {
      /* explicit zero at 1-based position (m, number of columns) */
#if defined(PETSC_USE_COMPLEX)
      PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.));
#else
      PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, A->cmap->n, 0.0));
#endif
    }
    PetscCall(PetscObjectGetName((PetscObject)A, &name));
    PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name));
    PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
  } else if (format == PETSC_VIEWER_ASCII_COMMON) {
    PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
    for (i = 0; i < m; i++) {
      PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
      for (j = a->i[i]; j < a->i[i + 1]; j++) {
#if defined(PETSC_USE_COMPLEX)
        /* NOTE(review): all three branches require a nonzero real part, so an entry whose real part is zero is never printed, even if its imaginary part is nonzero */
        if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) {
          PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
        } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) {
          PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
        } else if (PetscRealPart(a->a[j]) != 0.0) {
          PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
        }
#else
        if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
#endif
      }
      PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
    }
    PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
  } else if (format == PETSC_VIEWER_ASCII_SYMMODU) {
    PetscInt nzd = 0, fshift = 1, *sptr;
    PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
    PetscCall(PetscMalloc1(m + 1, &sptr));
    /* sptr[i] is the 1-based position of row i's first counted entry; only nonzero entries with column >= row are counted */
    for (i = 0; i < m; i++) {
      sptr[i] = nzd + 1;
      for (j = a->i[i]; j < a->i[i + 1]; j++) {
        if (a->j[j] >= i) {
#if defined(PETSC_USE_COMPLEX)
          if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++;
#else
          if (a->a[j] != 0.0) nzd++;
#endif
        }
      }
    }
    sptr[m] = nzd + 1;
    PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd));
    /* print the m + 1 row pointers six per line; the branches handle a shorter final line */
    for (i = 0; i < m + 1; i += 6) {
      if (i + 4 < m) {
        PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5]));
      } else if (i + 3 < m) {
        PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4]));
      } else if (i + 2 < m) {
        PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3]));
      } else if (i + 1 < m) {
        PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2]));
      } else if (i < m) {
        PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1]));
      } else {
        PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i]));
      }
    }
    PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
    PetscCall(PetscFree(sptr));
    /* 1-based column indices of the entries with column >= row */
    /* NOTE(review): unlike the count above and the values below, this loop does not skip entries whose value is zero */
    for (i = 0; i < m; i++) {
      for (j = a->i[i]; j < a->i[i + 1]; j++) {
        if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift));
      }
      PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
    }
    PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
    /* values of the nonzero entries with column >= row */
    for (i = 0; i < m; i++) {
      for (j = a->i[i]; j < a->i[i + 1]; j++) {
        if (a->j[j] >= i) {
#if defined(PETSC_USE_COMPLEX)
          if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
#else
          if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j]));
#endif
        }
      }
      PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
    }
    PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
  } else if (format == PETSC_VIEWER_ASCII_DENSE) {
    PetscInt    cnt = 0, jcnt;
    PetscScalar value;
#if defined(PETSC_USE_COMPLEX)
    PetscBool realonly = PETSC_TRUE;

    /* if no stored value has an imaginary part, only real parts are printed */
    for (i = 0; i < a->i[m]; i++) {
      if (PetscImaginaryPart(a->a[i]) != 0.0) {
        realonly = PETSC_FALSE;
        break;
      }
    }
#endif

    PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
    /* cnt walks the stored entries in storage order; jcnt counts how many entries of the current row were consumed */
    /* assumes the column indices within each row are increasing, otherwise entries are missed -- TODO confirm */
    for (i = 0; i < m; i++) {
      jcnt = 0;
      for (j = 0; j < A->cmap->n; j++) {
        if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) {
          value = a->a[cnt++];
          jcnt++;
        } else {
          value = 0.0;
        }
#if defined(PETSC_USE_COMPLEX)
        if (realonly) {
          PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value)));
        } else {
          PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value)));
        }
#else
        PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value));
#endif
      }
      PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
    }
    PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
  } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) {
    PetscInt fshift = 1;
    PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
#if defined(PETSC_USE_COMPLEX)
    PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n"));
#else
    PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n"));
#endif
    /* size line: rows, columns, number of stored entries */
    PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz));
    /* one 1-based (row, column, value) line per stored entry */
    for (i = 0; i < m; i++) {
      for (j = a->i[i]; j < a->i[i + 1]; j++) {
#if defined(PETSC_USE_COMPLEX)
        PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
#else
        PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j]));
#endif
      }
    }
    PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
  } else {
    PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
    if (A->factortype) {
      /* factored matrix: each row is printed as three pieces located through a->i and a->diag */
      for (i = 0; i < m; i++) {
        PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
        /* L part */
        for (j = a->i[i]; j < a->i[i + 1]; j++) {
#if defined(PETSC_USE_COMPLEX)
          if (PetscImaginaryPart(a->a[j]) > 0.0) {
            PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
          } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
            PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
          } else {
            PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
          }
#else
          PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
#endif
        }
        /* diagonal */
        /* the reciprocal of the stored value is printed; presumably the factor stores the inverted diagonal -- TODO confirm */
        /* NOTE(review): the sign test uses the stored value but the printed imaginary part is that of its reciprocal, which has the opposite sign */
        j = a->diag[i];
#if defined(PETSC_USE_COMPLEX)
        if (PetscImaginaryPart(a->a[j]) > 0.0) {
          PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j])));
        } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
          PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j]))));
        } else {
          PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j])));
        }
#else
        PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j])));
#endif

        /* U part */
        /* the entries strictly between a->diag[i + 1] and a->diag[i] */
        for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) {
#if defined(PETSC_USE_COMPLEX)
          if (PetscImaginaryPart(a->a[j]) > 0.0) {
            PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
          } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
            PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
          } else {
            PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
          }
#else
          PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
#endif
        }
        PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
      }
    } else {
      /* unfactored matrix: print every stored entry of every row, including stored zeros */
      for (i = 0; i < m; i++) {
        PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
        for (j = a->i[i]; j < a->i[i + 1]; j++) {
#if defined(PETSC_USE_COMPLEX)
          if (PetscImaginaryPart(a->a[j]) > 0.0) {
            PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
          } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
            PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
          } else {
            PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
          }
#else
          PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
#endif
        }
        PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
      }
    }
    PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
  }
  PetscCall(PetscViewerFlush(viewer));
  PetscFunctionReturn(PETSC_SUCCESS);
}
(PetscImaginaryPart(a->a[j]) > 0.0) { 9469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94736db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9493a40ed3dSBarry Smith } else { 9509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 95117ab2063SBarry Smith } 95217ab2063SBarry Smith #else 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 95417ab2063SBarry Smith #endif 95517ab2063SBarry Smith } 9569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95717ab2063SBarry Smith } 95816cd7e1dSShri Abhyankar } 9599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 96017ab2063SBarry Smith } 9619566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 963416022c9SBarry Smith } 964416022c9SBarry Smith 9659804daf3SBarry Smith #include <petscdraw.h> 966d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 967d71ae5a4SJacob Faibussowitsch { 968480ef9eaSBarry Smith Mat A = (Mat)Aa; 969416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 970383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 971383922c3SLisandro Dalcin int color; 972b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 973b0a32e0cSBarry Smith PetscViewer viewer; 974f3ef73ceSBarry Smith PetscViewerFormat format; 975fff043a9SJunchao Zhang const PetscScalar *aa; 976cddf8d76SBarry Smith 9773a40ed3dSBarry 
Smith PetscFunctionBegin; 9789566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9799566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9809566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 981383922c3SLisandro Dalcin 982416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 984fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 985d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9860513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 987b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 988416022c9SBarry Smith for (i = 0; i < m; i++) { 9899371c9d4SSatish Balay y_l = m - i - 1.0; 9909371c9d4SSatish Balay y_r = y_l + 1.0; 991bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9929371c9d4SSatish Balay x_l = a->j[j]; 9939371c9d4SSatish Balay x_r = x_l + 1.0; 994fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9959566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 996cddf8d76SBarry Smith } 997cddf8d76SBarry Smith } 998b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 999cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10009371c9d4SSatish Balay y_l = m - i - 1.0; 10019371c9d4SSatish Balay y_r = y_l + 1.0; 1002bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10039371c9d4SSatish Balay x_l = a->j[j]; 10049371c9d4SSatish Balay x_r = x_l + 1.0; 1005fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 10069566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1007cddf8d76SBarry Smith } 1008cddf8d76SBarry Smith } 1009b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1010cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10119371c9d4SSatish Balay y_l = m - i - 1.0; 10129371c9d4SSatish Balay y_r = y_l + 1.0; 1013bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10149371c9d4SSatish Balay x_l = a->j[j]; 10159371c9d4SSatish Balay x_r = x_l + 1.0; 1016fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10179566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1018416022c9SBarry Smith } 1019416022c9SBarry Smith } 1020d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10210513a670SBarry Smith } else { 10220513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10230513a670SBarry Smith /* first determine max of all nonzero values */ 1024b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1025383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1026b0a32e0cSBarry Smith PetscDraw popup; 10270513a670SBarry Smith 10280513a670SBarry Smith for (i = 0; i < nz; i++) { 1029fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10300513a670SBarry Smith } 1031383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10329566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10339566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1034383922c3SLisandro Dalcin 1035d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10360513a670SBarry Smith for (i = 0; i < m; i++) { 1037383922c3SLisandro Dalcin y_l = m - i - 1.0; 1038383922c3SLisandro Dalcin y_r = y_l + 1.0; 1039bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1040383922c3SLisandro Dalcin x_l = a->j[j]; 1041383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1042fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10439566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10440513a670SBarry Smith count++; 10450513a670SBarry Smith } 10460513a670SBarry Smith } 1047d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10480513a670SBarry Smith } 10499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1051480ef9eaSBarry Smith } 1052cddf8d76SBarry Smith 10539804daf3SBarry Smith #include <petscdraw.h> 1054d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1055d71ae5a4SJacob Faibussowitsch { 1056b0a32e0cSBarry Smith PetscDraw draw; 105736db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1058ace3abfcSBarry Smith PetscBool isnull; 1059480ef9eaSBarry Smith 1060480ef9eaSBarry Smith PetscFunctionBegin; 10619566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10629566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10633ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1064480ef9eaSBarry Smith 10659371c9d4SSatish Balay xr = A->cmap->n; 10669371c9d4SSatish Balay yr = A->rmap->n; 10679371c9d4SSatish Balay h = yr / 10.0; 10689371c9d4SSatish Balay w = xr / 10.0; 10699371c9d4SSatish Balay xr += w; 10709371c9d4SSatish Balay yr += h; 10719371c9d4SSatish Balay xl = -w; 10729371c9d4SSatish Balay yl = -h; 10739566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10749566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10759566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10769566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10779566063dSJacob Faibussowitsch 
PetscCall(PetscDrawSave(draw)); 10783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1079416022c9SBarry Smith } 1080416022c9SBarry Smith 1081d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1082d71ae5a4SJacob Faibussowitsch { 1083ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1084416022c9SBarry Smith 10853a40ed3dSBarry Smith PetscFunctionBegin; 10869566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10889566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10891baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10901baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10911baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10929566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109417ab2063SBarry Smith } 109519bcc07fSBarry Smith 1096d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1097d71ae5a4SJacob Faibussowitsch { 1098416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1099580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1100d0f46423SBarry Smith PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0; 110154f21887SBarry Smith MatScalar *aa = a->a, *ap; 11023447b6efSHong Zhang PetscReal ratio = 0.6; 110317ab2063SBarry Smith 11043a40ed3dSBarry Smith PetscFunctionBegin; 11053ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 11069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1107b215bc84SStefano Zampini if (A->was_assembled && 
A->ass_nonzerostate == A->nonzerostate) { 1108b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11099566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1111b215bc84SStefano Zampini } 111217ab2063SBarry Smith 111343ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 111417ab2063SBarry Smith for (i = 1; i < m; i++) { 1115416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 111617ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111794a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111817ab2063SBarry Smith if (fshift) { 1119bfeeae90SHong Zhang ip = aj + ai[i]; 1120bfeeae90SHong Zhang ap = aa + ai[i]; 112117ab2063SBarry Smith N = ailen[i]; 11229566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 112348a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 112417ab2063SBarry Smith } 112517ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112617ab2063SBarry Smith } 112717ab2063SBarry Smith if (m) { 112817ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112917ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 113017ab2063SBarry Smith } 113117ab2063SBarry Smith /* reset ilen and imax for each row */ 11327b083b7cSBarry Smith a->nonzerorowcnt = 0; 1133396832f4SHong Zhang if (A->structure_only) { 11349566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11359566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1136396832f4SHong Zhang } else { /* !A->structure_only */ 113717ab2063SBarry Smith for (i = 0; i < m; i++) { 113817ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11397b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 114017ab2063SBarry Smith } 1141396832f4SHong Zhang } 1142bfeeae90SHong Zhang a->nz = 
ai[m]; 1143aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 114417ab2063SBarry Smith 11459566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11469566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11479566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11489566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11492205254eSKarl Rupp 11508e58a170SBarry Smith A->info.mallocs += a->reallocs; 1151dd5f02e7SSatish Balay a->reallocs = 0; 11526712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 115336db0b34SBarry Smith a->rmax = rmax; 11544e220ebcSLois Curfman McInnes 115548a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11569566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 115817ab2063SBarry Smith } 115917ab2063SBarry Smith 1160d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1161d71ae5a4SJacob Faibussowitsch { 116299cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116399cafbc1SBarry Smith PetscInt i, nz = a->nz; 11642e5835c6SStefano Zampini MatScalar *aa; 116599cafbc1SBarry Smith 116699cafbc1SBarry Smith PetscFunctionBegin; 11679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116899cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11709566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 117299cafbc1SBarry Smith } 117399cafbc1SBarry Smith 1174d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1175d71ae5a4SJacob Faibussowitsch { 117699cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 117799cafbc1SBarry Smith PetscInt i, nz = a->nz; 11782e5835c6SStefano Zampini MatScalar *aa; 117999cafbc1SBarry Smith 118099cafbc1SBarry Smith PetscFunctionBegin; 11819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 118299cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 118699cafbc1SBarry Smith } 118799cafbc1SBarry Smith 1188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1189d71ae5a4SJacob Faibussowitsch { 1190fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1191fff043a9SJunchao Zhang MatScalar *aa; 11923a40ed3dSBarry Smith 11933a40ed3dSBarry Smith PetscFunctionBegin; 11949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11959566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119917ab2063SBarry Smith } 1200416022c9SBarry Smith 1201d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1202d71ae5a4SJacob Faibussowitsch { 1203cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1204cbc6b225SStefano Zampini 1205cbc6b225SStefano Zampini PetscFunctionBegin; 12069566063dSJacob 
Faibussowitsch PetscCall(PetscFree(a->perm)); 12079566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 12083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1209cbc6b225SStefano Zampini } 1210cbc6b225SStefano Zampini 1211d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1212d71ae5a4SJacob Faibussowitsch { 1213416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1214d5d45c9bSBarry Smith 12153a40ed3dSBarry Smith PetscFunctionBegin; 1216aa482453SBarry Smith #if defined(PETSC_USE_LOG) 12173ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 121817ab2063SBarry Smith #endif 12199566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12209566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12219566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12229566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12289566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12299566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12309566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12319566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12329566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12339566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12349566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1235901853e0SKris Buschelman 12366718818eSStefano Zampini /* 
MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12376718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12386718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12396718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12406718818eSStefano Zampini due to different matrix sizes */ 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12426718818eSStefano Zampini 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12442e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12452e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12522e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12532e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12542e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", 
NULL)); 12552e956fe4SStefano Zampini #endif 12564222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12604222ddf1SHong Zhang #endif 1261d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1262d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1263d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1264d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1265d5e393b6SSuyash Tandon #endif 12663d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12683d0639e7SStefano Zampini #endif 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1270af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1272af8000cdSHong Zhang #endif 1273d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1275d24d4204SJose E. 
Roman #endif 127663c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 127963c07aadSStefano Zampini #endif 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12842e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12952e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12962e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12972e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12982e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12992e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 13002e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 13012e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 13023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 130317ab2063SBarry Smith } 130417ab2063SBarry Smith 1305d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1306d71ae5a4SJacob Faibussowitsch { 1307416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13083a40ed3dSBarry Smith 13093a40ed3dSBarry Smith PetscFunctionBegin; 1310a65d3064SKris Buschelman switch (op) { 1311d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1312d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1313d71ae5a4SJacob Faibussowitsch break; 1314d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1315d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1316d71ae5a4SJacob Faibussowitsch break; 1317d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 
1318d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1319d71ae5a4SJacob Faibussowitsch break; 1320d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1321d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1322d71ae5a4SJacob Faibussowitsch break; 1323d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1324d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1325d71ae5a4SJacob Faibussowitsch break; 1326d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1327d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1328d71ae5a4SJacob Faibussowitsch break; 1329d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1330d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1331d71ae5a4SJacob Faibussowitsch break; 13323d472b54SHong Zhang case MAT_SPD: 1333b1646e73SJed Brown case MAT_SYMMETRIC: 1334b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1335b1646e73SJed Brown case MAT_HERMITIAN: 1336b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1337957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1338b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1339b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1340b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13415021d80fSJed Brown break; 13428c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1343a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1344d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1345d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1346d71ae5a4SJacob Faibussowitsch break; 1347d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1348d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1349d71ae5a4SJacob Faibussowitsch break; 1350d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1351d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1352d71ae5a4SJacob Faibussowitsch break; 
1353071fcb05SBarry Smith case MAT_SORTED_FULL: 1354071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1355071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1356071fcb05SBarry Smith break; 1357d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1358d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1359d71ae5a4SJacob Faibussowitsch break; 1360d71ae5a4SJacob Faibussowitsch default: 1361d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1362a65d3064SKris Buschelman } 13633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 136417ab2063SBarry Smith } 136517ab2063SBarry Smith 1366d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1367d71ae5a4SJacob Faibussowitsch { 1368416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1369fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1370c898d852SStefano Zampini PetscScalar *x; 1371c898d852SStefano Zampini const PetscScalar *aa; 137217ab2063SBarry Smith 13733a40ed3dSBarry Smith PetscFunctionBegin; 13749566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 137508401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1377d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1378d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13799566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13802c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13819566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 138435e7444dSHong Zhang } 138535e7444dSHong Zhang 13869566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 138735e7444dSHong Zhang for (i = 0; i < n; i++) { 1388fdc842d1SBarry Smith x[i] = 0.0; 138935e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 139035e7444dSHong Zhang if (aj[j] == i) { 139135e7444dSHong Zhang x[i] = aa[j]; 139217ab2063SBarry Smith break; 139317ab2063SBarry Smith } 139417ab2063SBarry Smith } 139517ab2063SBarry Smith } 13969566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 139917ab2063SBarry Smith } 140017ab2063SBarry Smith 1401c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1403d71ae5a4SJacob Faibussowitsch { 1404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 14055f22a7b3SSebastian Grimberg const MatScalar *aa; 1406d9ca1df4SBarry Smith PetscScalar *y; 1407d9ca1df4SBarry Smith const PetscScalar *x; 1408d0f46423SBarry Smith PetscInt m = A->rmap->n; 14095c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14105f22a7b3SSebastian Grimberg const MatScalar *v; 1411a77337e4SBarry Smith PetscScalar alpha; 1412d9ca1df4SBarry Smith PetscInt n, i, j; 1413d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14143447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1415ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14165c897100SBarry Smith #endif 141717ab2063SBarry Smith 14183a40ed3dSBarry Smith PetscFunctionBegin; 14199566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14209566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14219566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14235c897100SBarry Smith 14245c897100SBarry Smith #if 
defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1425fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14265c897100SBarry Smith #else 14273447b6efSHong Zhang if (usecprow) { 14283447b6efSHong Zhang m = cprow.nrows; 14293447b6efSHong Zhang ii = cprow.i; 14307b2bb3b9SHong Zhang ridx = cprow.rindex; 14313447b6efSHong Zhang } else { 14323447b6efSHong Zhang ii = a->i; 14333447b6efSHong Zhang } 143417ab2063SBarry Smith for (i = 0; i < m; i++) { 14353447b6efSHong Zhang idx = a->j + ii[i]; 1436fff043a9SJunchao Zhang v = aa + ii[i]; 14373447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14383447b6efSHong Zhang if (usecprow) { 14397b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14403447b6efSHong Zhang } else { 144117ab2063SBarry Smith alpha = x[i]; 14423447b6efSHong Zhang } 144304fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 144417ab2063SBarry Smith } 14455c897100SBarry Smith #endif 14469566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14479566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14489566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 145117ab2063SBarry Smith } 145217ab2063SBarry Smith 1453d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1454d71ae5a4SJacob Faibussowitsch { 14555c897100SBarry Smith PetscFunctionBegin; 14569566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14579566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14595c897100SBarry Smith } 14605c897100SBarry Smith 1461c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 146278b84d54SShri Abhyankar 1463d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 
1464d71ae5a4SJacob Faibussowitsch { 1465416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1466d9fead3dSBarry Smith PetscScalar *y; 146754f21887SBarry Smith const PetscScalar *x; 1468fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1469003131ecSBarry Smith PetscInt m = A->rmap->n; 14700298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14717b083b7cSBarry Smith PetscInt n, i; 1472362ced78SSatish Balay PetscScalar sum; 1473ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 147417ab2063SBarry Smith 1475b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 147697952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1477fee21e36SBarry Smith #endif 1478fee21e36SBarry Smith 14793a40ed3dSBarry Smith PetscFunctionBegin; 1480b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14819566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1483b215bc84SStefano Zampini } 14849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14859566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14869566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1487416022c9SBarry Smith ii = a->i; 14884eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14899566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 149097952fefSHong Zhang m = a->compressedrow.nrows; 149197952fefSHong Zhang ii = a->compressedrow.i; 149297952fefSHong Zhang ridx = a->compressedrow.rindex; 149397952fefSHong Zhang for (i = 0; i < m; i++) { 149497952fefSHong Zhang n = ii[i + 1] - ii[i]; 149597952fefSHong Zhang aj = a->j + ii[i]; 1496fff043a9SJunchao Zhang aa = a_a + ii[i]; 149797952fefSHong Zhang sum = 0.0; 1498003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1499003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 150097952fefSHong Zhang y[*ridx++] = sum; 150197952fefSHong Zhang } 150297952fefSHong 
Zhang } else { /* do not use compressed row format */ 1503b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15043d3eaba7SBarry Smith aj = a->j; 1505fff043a9SJunchao Zhang aa = a_a; 1506b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1507b05257ddSBarry Smith #else 150817ab2063SBarry Smith for (i = 0; i < m; i++) { 1509003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1510003131ecSBarry Smith aj = a->j + ii[i]; 1511fff043a9SJunchao Zhang aa = a_a + ii[i]; 151217ab2063SBarry Smith sum = 0.0; 1513003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 151417ab2063SBarry Smith y[i] = sum; 151517ab2063SBarry Smith } 15168d195f9aSBarry Smith #endif 1517b05257ddSBarry Smith } 15189566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15209566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 152317ab2063SBarry Smith } 152417ab2063SBarry Smith 1525d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1526d71ae5a4SJacob Faibussowitsch { 1527b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1528b434eb95SMatthew G. Knepley PetscScalar *y; 1529b434eb95SMatthew G. Knepley const PetscScalar *x; 1530fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1531b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1532b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1533b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1534b434eb95SMatthew G. Knepley PetscScalar sum; 1535b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1536b434eb95SMatthew G. Knepley 1537b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1538b434eb95SMatthew G. 
Knepley #pragma disjoint(*x, *y, *aa) 1539b434eb95SMatthew G. Knepley #endif 1540b434eb95SMatthew G. Knepley 1541b434eb95SMatthew G. Knepley PetscFunctionBegin; 15429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15439566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15449566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1545b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1546b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1547b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1548b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1549b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1550b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1551b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1552fff043a9SJunchao Zhang aa = a_a + ii[i]; 1553b434eb95SMatthew G. Knepley sum = 0.0; 1554b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1555b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1556b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1557b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1558b434eb95SMatthew G. Knepley } 1559b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15603d3eaba7SBarry Smith ii = a->i; 1561b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1562b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1563b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1564fff043a9SJunchao Zhang aa = a_a + ii[i]; 1565b434eb95SMatthew G. Knepley sum = 0.0; 1566b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1567b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1568b434eb95SMatthew G. Knepley y[i] = sum; 1569b434eb95SMatthew G. Knepley } 1570b434eb95SMatthew G. 
Knepley } 15719566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15729566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15739566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1576b434eb95SMatthew G. Knepley } 1577b434eb95SMatthew G. Knepley 1578d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1579d71ae5a4SJacob Faibussowitsch { 1580b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1581b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1582b434eb95SMatthew G. Knepley const PetscScalar *x; 1583fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1584b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1585b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1586b434eb95SMatthew G. Knepley PetscScalar sum; 1587b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1588b434eb95SMatthew G. Knepley 1589b434eb95SMatthew G. Knepley PetscFunctionBegin; 15909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15919566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15929566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1593b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 159448a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1595b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1596b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1597b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1598b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1599b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1600b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1601fff043a9SJunchao Zhang aa = a_a + ii[i]; 1602b434eb95SMatthew G. 
Knepley sum = y[*ridx]; 1603b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1604b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1605b434eb95SMatthew G. Knepley } 1606b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16073d3eaba7SBarry Smith ii = a->i; 1608b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1609b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1610b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1611fff043a9SJunchao Zhang aa = a_a + ii[i]; 1612b434eb95SMatthew G. Knepley sum = y[i]; 1613b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1614b434eb95SMatthew G. Knepley z[i] = sum; 1615b434eb95SMatthew G. Knepley } 1616b434eb95SMatthew G. Knepley } 16179566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16189566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1622b434eb95SMatthew G. Knepley } 1623b434eb95SMatthew G. 
Knepley 1624c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1625d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1626d71ae5a4SJacob Faibussowitsch { 1627416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1628f15663dcSBarry Smith PetscScalar *y, *z; 1629f15663dcSBarry Smith const PetscScalar *x; 1630fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1631d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1632d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1633362ced78SSatish Balay PetscScalar sum; 1634ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16359ea0dfa2SSatish Balay 16363a40ed3dSBarry Smith PetscFunctionBegin; 1637b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16389566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1640b215bc84SStefano Zampini } 16419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16429566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16439566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16444eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 164548a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 164697952fefSHong Zhang m = a->compressedrow.nrows; 164797952fefSHong Zhang ii = a->compressedrow.i; 164897952fefSHong Zhang ridx = a->compressedrow.rindex; 164997952fefSHong Zhang for (i = 0; i < m; i++) { 165097952fefSHong Zhang n = ii[i + 1] - ii[i]; 165197952fefSHong Zhang aj = a->j + ii[i]; 1652fff043a9SJunchao Zhang aa = a_a + ii[i]; 165397952fefSHong Zhang sum = y[*ridx]; 1654f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165597952fefSHong Zhang z[*ridx++] = sum; 165697952fefSHong Zhang } 165797952fefSHong Zhang } else { /* do not use compressed row format */ 16583d3eaba7SBarry Smith ii = a->i; 
1659f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16603d3eaba7SBarry Smith aj = a->j; 1661fff043a9SJunchao Zhang aa = a_a; 1662f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1663f15663dcSBarry Smith #else 166417ab2063SBarry Smith for (i = 0; i < m; i++) { 1665f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1666f15663dcSBarry Smith aj = a->j + ii[i]; 1667fff043a9SJunchao Zhang aa = a_a + ii[i]; 166817ab2063SBarry Smith sum = y[i]; 1669f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 167017ab2063SBarry Smith z[i] = sum; 167117ab2063SBarry Smith } 167202ab625aSSatish Balay #endif 1673f15663dcSBarry Smith } 16749566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16759566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16769566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 167917ab2063SBarry Smith } 168017ab2063SBarry Smith 168117ab2063SBarry Smith /* 168217ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
168317ab2063SBarry Smith */ 1684d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1685d71ae5a4SJacob Faibussowitsch { 1686416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1687d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1688c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 168917ab2063SBarry Smith 16903a40ed3dSBarry Smith PetscFunctionBegin; 169109f38230SBarry Smith if (!a->diag) { 16929566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1693c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 169409f38230SBarry Smith } 1695d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1696c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1697c0c07093SJunchao Zhang if (alreadySet) { 1698c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1699c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1700c0c07093SJunchao Zhang } 1701c0c07093SJunchao Zhang 170209f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1703bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1704bfeeae90SHong Zhang if (a->j[j] == i) { 170509f38230SBarry Smith a->diag[i] = j; 170617ab2063SBarry Smith break; 170717ab2063SBarry Smith } 170817ab2063SBarry Smith } 170917ab2063SBarry Smith } 17103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 171117ab2063SBarry Smith } 171217ab2063SBarry Smith 1713d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1714d71ae5a4SJacob Faibussowitsch { 171561ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 171661ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 171761ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 171861ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 171961ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 172061ecd0c6SBarry Smith 172161ecd0c6SBarry Smith 
PetscFunctionBegin; 172261ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17249566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 17253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 172661ecd0c6SBarry Smith } 172761ecd0c6SBarry Smith 172861ecd0c6SBarry Smith if (a->diagonaldense) { 172961ecd0c6SBarry Smith cnt = 0; 173061ecd0c6SBarry Smith } else { 17319566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 173261ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1733349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 173461ecd0c6SBarry Smith cnt++; 173561ecd0c6SBarry Smith mdiag[i] = 1; 173661ecd0c6SBarry Smith } 173761ecd0c6SBarry Smith } 173861ecd0c6SBarry Smith } 173961ecd0c6SBarry Smith if (!cnt) { 17409566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 174161ecd0c6SBarry Smith } else { 1742b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1743b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 174461ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 174561ecd0c6SBarry Smith 174661ecd0c6SBarry Smith a->a = NULL; 174761ecd0c6SBarry Smith a->j = NULL; 174861ecd0c6SBarry Smith a->i = NULL; 174961ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1750ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 175261ecd0c6SBarry Smith 175361ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 175461ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17559566063dSJacob Faibussowitsch 
PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 175648a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1757447d62f5SStefano Zampini } 17589566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17599566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 176061ecd0c6SBarry Smith if (singlemalloc) { 17619566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 176261ecd0c6SBarry Smith } else { 17639566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17649566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17659566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 176661ecd0c6SBarry Smith } 176761ecd0c6SBarry Smith } 17689566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 176961ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 17703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 177161ecd0c6SBarry Smith } 177261ecd0c6SBarry Smith 1773be5855fcSBarry Smith /* 1774be5855fcSBarry Smith Checks for missing diagonals 1775be5855fcSBarry Smith */ 1776d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1777d71ae5a4SJacob Faibussowitsch { 1778be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17797734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1780be5855fcSBarry Smith 1781be5855fcSBarry Smith PetscFunctionBegin; 178209f38230SBarry Smith *missing = PETSC_FALSE; 17837734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 178409f38230SBarry Smith *missing = PETSC_TRUE; 178509f38230SBarry Smith if (d) *d = 0; 17869566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 178709f38230SBarry Smith } else { 178801445905SHong Zhang PetscInt n; 178901445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1790f1e2ffcdSBarry Smith diag = a->diag; 179101445905SHong Zhang for (i = 0; i < n; i++) { 17927734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 179309f38230SBarry Smith *missing = PETSC_TRUE; 179409f38230SBarry Smith if (d) *d = i; 17959566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1796358d2f5dSShri Abhyankar break; 179709f38230SBarry Smith } 1798be5855fcSBarry Smith } 1799be5855fcSBarry Smith } 18003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1801be5855fcSBarry Smith } 1802be5855fcSBarry Smith 18030da83c2eSBarry Smith #include <petscblaslapack.h> 18040da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18050da83c2eSBarry Smith 18060da83c2eSBarry Smith /* 18070da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18080da83c2eSBarry Smith */ 1809d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1810d71ae5a4SJacob Faibussowitsch { 18110da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18120da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18130da83c2eSBarry Smith const PetscReal shift = 0.0; 18140da83c2eSBarry Smith PetscInt ipvt[5]; 18154e208921SJed Brown PetscCount flops = 0; 18160da83c2eSBarry Smith PetscScalar work[25], *v_work; 18170da83c2eSBarry Smith 18180da83c2eSBarry Smith PetscFunctionBegin; 18190da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 
18200da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 182108401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1822ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 182448a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18250da83c2eSBarry Smith ncnt = 0; 18260da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18270da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18289566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18290da83c2eSBarry Smith switch (bsizes[i]) { 1830d71ae5a4SJacob Faibussowitsch case 1: 1831d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1832d71ae5a4SJacob Faibussowitsch break; 18330da83c2eSBarry Smith case 2: 18349566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18350da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18369566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18370da83c2eSBarry Smith break; 18380da83c2eSBarry Smith case 3: 18399566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18400da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18420da83c2eSBarry Smith break; 18430da83c2eSBarry Smith case 4: 18449566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18450da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 18469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18470da83c2eSBarry Smith break; 18480da83c2eSBarry Smith case 5: 18499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18500da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18520da83c2eSBarry Smith break; 18530da83c2eSBarry Smith case 6: 18549566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18550da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18569566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18570da83c2eSBarry Smith break; 18580da83c2eSBarry Smith case 7: 18599566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18600da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18619566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18620da83c2eSBarry Smith break; 18630da83c2eSBarry Smith default: 18649566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18650da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18669566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18670da83c2eSBarry Smith } 18680da83c2eSBarry Smith ncnt += bsizes[i]; 18690da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 18704e208921SJed Brown flops += 2 * PetscPowInt(bsizes[i], 3) / 3; 18710da83c2eSBarry Smith } 18723ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 187348a46eb9SPierre Jolivet if (bsizemax > 7) 
PetscCall(PetscFree2(v_work, v_pivots)); 18749566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18760da83c2eSBarry Smith } 18770da83c2eSBarry Smith 1878422a814eSBarry Smith /* 1879422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1880422a814eSBarry Smith */ 1881d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1882d71ae5a4SJacob Faibussowitsch { 188371f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1884d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18852e5835c6SStefano Zampini const MatScalar *v; 188654f21887SBarry Smith PetscScalar *idiag, *mdiag; 188771f1c65dSBarry Smith 188871f1c65dSBarry Smith PetscFunctionBegin; 18893ba16761SJacob Faibussowitsch if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS); 18909566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 189171f1c65dSBarry Smith diag = a->diag; 18924dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18932e5835c6SStefano Zampini 189471f1c65dSBarry Smith mdiag = a->mdiag; 189571f1c65dSBarry Smith idiag = a->idiag; 18969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1897422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 189871f1c65dSBarry Smith for (i = 0; i < m; i++) { 189971f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1900899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1901899639b0SHong Zhang if (PetscRealPart(fshift)) { 19029566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 19037b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19047b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19057b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 
190698921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1907899639b0SHong Zhang } 190871f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 190971f1c65dSBarry Smith } 19109566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 191171f1c65dSBarry Smith } else { 191271f1c65dSBarry Smith for (i = 0; i < m; i++) { 191371f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 191471f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 191571f1c65dSBarry Smith } 19169566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 191771f1c65dSBarry Smith } 191871f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 19203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 192171f1c65dSBarry Smith } 192271f1c65dSBarry Smith 1923c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 1924d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1925d71ae5a4SJacob Faibussowitsch { 1926416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1927e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19282e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 192954f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19303d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 193197f1f81fSBarry Smith const PetscInt *idx, *diag; 193217ab2063SBarry Smith 19333a40ed3dSBarry Smith PetscFunctionBegin; 1934b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19359566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 19363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1937b215bc84SStefano Zampini } 1938b965ef7fSBarry Smith its = its * lits; 193991723122SBarry Smith 
194071f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19419566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 194271f1c65dSBarry Smith a->fshift = fshift; 194371f1c65dSBarry Smith a->omega = omega; 1944ed480e8bSBarry Smith 194571f1c65dSBarry Smith diag = a->diag; 194671f1c65dSBarry Smith t = a->ssor_work; 1947ed480e8bSBarry Smith idiag = a->idiag; 194871f1c65dSBarry Smith mdiag = a->mdiag; 1949ed480e8bSBarry Smith 19509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19519566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19529566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1953ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 195417ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 195517ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1956ed480e8bSBarry Smith bs = b; 195717ab2063SBarry Smith for (i = 0; i < m; i++) { 195871f1c65dSBarry Smith d = fshift + mdiag[i]; 1959416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1960ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19612e5835c6SStefano Zampini v = aa + diag[i] + 1; 196217ab2063SBarry Smith sum = b[i] * d / omega; 1963003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 196417ab2063SBarry Smith x[i] = sum; 196517ab2063SBarry Smith } 19669566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19679566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19699566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 197117ab2063SBarry Smith } 1972c783ea89SBarry Smith 197308401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, 
"SOR_APPLY_LOWER is not implemented"); 1974f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19754c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1976887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 197717ab2063SBarry Smith 197817ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 197917ab2063SBarry Smith 1980887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 198117ab2063SBarry Smith */ 198217ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 198317ab2063SBarry Smith 198417ab2063SBarry Smith /* x = (E + U)^{-1} b */ 198517ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1986416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1987ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19882e5835c6SStefano Zampini v = aa + diag[i] + 1; 198917ab2063SBarry Smith sum = b[i]; 1990e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1991ed480e8bSBarry Smith x[i] = sum * idiag[i]; 199217ab2063SBarry Smith } 199317ab2063SBarry Smith 199417ab2063SBarry Smith /* t = b - (2*E - D)x */ 19952e5835c6SStefano Zampini v = aa; 19962205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 199717ab2063SBarry Smith 199817ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1999ed480e8bSBarry Smith ts = t; 2000416022c9SBarry Smith diag = a->diag; 200117ab2063SBarry Smith for (i = 0; i < m; i++) { 2002416022c9SBarry Smith n = diag[i] - a->i[i]; 2003ed480e8bSBarry Smith idx = a->j + a->i[i]; 20042e5835c6SStefano Zampini v = aa + a->i[i]; 200517ab2063SBarry Smith sum = t[i]; 2006003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 2007ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2008733d66baSBarry Smith /* x = x + t */ 2009733d66baSBarry Smith x[i] += t[i]; 201017ab2063SBarry Smith } 201117ab2063SBarry Smith 20129566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20139566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20149566063dSJacob 
Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 201617ab2063SBarry Smith } 201717ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 201817ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 201917ab2063SBarry Smith for (i = 0; i < m; i++) { 2020416022c9SBarry Smith n = diag[i] - a->i[i]; 2021ed480e8bSBarry Smith idx = a->j + a->i[i]; 20222e5835c6SStefano Zampini v = aa + a->i[i]; 202317ab2063SBarry Smith sum = b[i]; 2024e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20255c99c7daSBarry Smith t[i] = sum; 2026ed480e8bSBarry Smith x[i] = sum * idiag[i]; 202717ab2063SBarry Smith } 20285c99c7daSBarry Smith xb = t; 20299566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20303a40ed3dSBarry Smith } else xb = b; 203117ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 203217ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2033416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2034ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20352e5835c6SStefano Zampini v = aa + diag[i] + 1; 203617ab2063SBarry Smith sum = xb[i]; 2037e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20385c99c7daSBarry Smith if (xb == b) { 2039ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20405c99c7daSBarry Smith } else { 2041b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 204217ab2063SBarry Smith } 20435c99c7daSBarry Smith } 20449566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 204517ab2063SBarry Smith } 204617ab2063SBarry Smith its--; 204717ab2063SBarry Smith } 204817ab2063SBarry Smith while (its--) { 204917ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 205017ab2063SBarry Smith for (i = 0; i < m; i++) { 2051b19a5dc2SMark Adams /* lower */ 2052b19a5dc2SMark Adams n = diag[i] - a->i[i]; 
2053ed480e8bSBarry Smith idx = a->j + a->i[i]; 20542e5835c6SStefano Zampini v = aa + a->i[i]; 205517ab2063SBarry Smith sum = b[i]; 2056e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2057b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2058b19a5dc2SMark Adams /* upper */ 2059b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2060b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20612e5835c6SStefano Zampini v = aa + diag[i] + 1; 2062b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2063b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 206417ab2063SBarry Smith } 2065b19a5dc2SMark Adams xb = t; 20669566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2067b19a5dc2SMark Adams } else xb = b; 206817ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 206917ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2070b19a5dc2SMark Adams sum = xb[i]; 2071b19a5dc2SMark Adams if (xb == b) { 2072b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2073416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2074ed480e8bSBarry Smith idx = a->j + a->i[i]; 20752e5835c6SStefano Zampini v = aa + a->i[i]; 2076e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2077ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2078b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2079b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2080b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20812e5835c6SStefano Zampini v = aa + diag[i] + 1; 2082b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2083b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 208417ab2063SBarry Smith } 2085b19a5dc2SMark Adams } 2086b19a5dc2SMark Adams if (xb == b) { 20879566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2088b19a5dc2SMark Adams } else { 20899566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2090b19a5dc2SMark Adams } 209117ab2063SBarry Smith } 209217ab2063SBarry Smith } 20939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20949566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20959566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 209717ab2063SBarry Smith } 209817ab2063SBarry Smith 2099d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2100d71ae5a4SJacob Faibussowitsch { 2101416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21024e220ebcSLois Curfman McInnes 21033a40ed3dSBarry Smith PetscFunctionBegin; 21044e220ebcSLois Curfman McInnes info->block_size = 1.0; 21053966268fSBarry Smith info->nz_allocated = a->maxnz; 21063966268fSBarry Smith info->nz_used = a->nz; 21073966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21083966268fSBarry Smith info->assemblies = A->num_ass; 21093966268fSBarry Smith info->mallocs = A->info.mallocs; 21104dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2111d5f3da31SBarry Smith if (A->factortype) { 21124e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21134e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21144e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21154e220ebcSLois Curfman McInnes } else { 21164e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21174e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21184e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 
21194e220ebcSLois Curfman McInnes } 21203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 212117ab2063SBarry Smith } 212217ab2063SBarry Smith 2123d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2124d71ae5a4SJacob Faibussowitsch { 2125416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2126c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 212797b48c8fSBarry Smith const PetscScalar *xx; 21282e5835c6SStefano Zampini PetscScalar *bb, *aa; 2129c7da8527SEric Chamberland PetscInt d = 0; 213017ab2063SBarry Smith 21313a40ed3dSBarry Smith PetscFunctionBegin; 213297b48c8fSBarry Smith if (x && b) { 21339566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21349566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 213597b48c8fSBarry Smith for (i = 0; i < N; i++) { 2136aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2137447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 213897b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 213997b48c8fSBarry Smith } 21409566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21419566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 214297b48c8fSBarry Smith } 214397b48c8fSBarry Smith 21449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2145a9817697SBarry Smith if (a->keepnonzeropattern) { 2146f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2147aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21489566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2149f1e2ffcdSBarry Smith } 2150f4df32b1SMatthew Knepley if (diag != 0.0) { 2151c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2152c7da8527SEric 
Chamberland d = rows[i]; 2153447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 215408401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2155c7da8527SEric Chamberland } 2156f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2157447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21582e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2159f1e2ffcdSBarry Smith } 2160f1e2ffcdSBarry Smith } 2161f1e2ffcdSBarry Smith } else { 2162f4df32b1SMatthew Knepley if (diag != 0.0) { 216317ab2063SBarry Smith for (i = 0; i < N; i++) { 2164aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21657ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2166447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2167447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2168447d62f5SStefano Zampini } else { 2169416022c9SBarry Smith a->ilen[rows[i]] = 1; 21702e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2171bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2172447d62f5SStefano Zampini } 2173447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21749566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 217517ab2063SBarry Smith } 217617ab2063SBarry Smith } 21773a40ed3dSBarry Smith } else { 217817ab2063SBarry Smith for (i = 0; i < N; i++) { 2179aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2180416022c9SBarry Smith a->ilen[rows[i]] = 0; 218117ab2063SBarry Smith } 218217ab2063SBarry Smith } 2183e56f5c9eSBarry Smith A->nonzerostate++; 2184f1e2ffcdSBarry Smith } 21859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2186dbbe0bcdSBarry Smith 
PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 218817ab2063SBarry Smith } 218917ab2063SBarry Smith 2190d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2191d71ae5a4SJacob Faibussowitsch { 21926e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21936e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21942b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21956e169961SBarry Smith const PetscScalar *xx; 21962e5835c6SStefano Zampini PetscScalar *bb, *aa; 21976e169961SBarry Smith 21986e169961SBarry Smith PetscFunctionBegin; 21993ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 22009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 22016e169961SBarry Smith if (x && b) { 22029566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 22039566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 22042b40b63fSBarry Smith vecs = PETSC_TRUE; 22056e169961SBarry Smith } 22069566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 22076e169961SBarry Smith for (i = 0; i < N; i++) { 2208aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 22099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 22102205254eSKarl Rupp 22116e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22126e169961SBarry Smith } 22136e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22146e169961SBarry Smith if (!zeroed[i]) { 22156e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22164cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22172e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22182e5835c6SStefano Zampini aa[j] = 0.0; 22196e169961SBarry 
Smith } 22206e169961SBarry Smith } 22214cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i]; 22226e169961SBarry Smith } 22236e169961SBarry Smith if (x && b) { 22249566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22259566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22266e169961SBarry Smith } 22279566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22286e169961SBarry Smith if (diag != 0.0) { 22299566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22301d5a398dSstefano_zampini if (missing) { 22311d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22324cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2233aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22349566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22351d5a398dSstefano_zampini } 22361d5a398dSstefano_zampini } else { 2237ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22386e169961SBarry Smith } 22391d5a398dSstefano_zampini } 22409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2241dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22436e169961SBarry Smith } 22446e169961SBarry Smith 2245d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2246d71ae5a4SJacob Faibussowitsch { 2247fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2248fff043a9SJunchao Zhang const PetscScalar *aa; 2249fff043a9SJunchao Zhang PetscInt *itmp; 225017ab2063SBarry Smith 22513a40ed3dSBarry Smith PetscFunctionBegin; 22529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
2253416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22542e5835c6SStefano Zampini if (v) *v = (PetscScalar *)(aa + a->i[row]); 225517ab2063SBarry Smith if (idx) { 2256bfeeae90SHong Zhang itmp = a->j + a->i[row]; 225726fbe8dcSKarl Rupp if (*nz) *idx = itmp; 2258f4259b30SLisandro Dalcin else *idx = NULL; 225917ab2063SBarry Smith } 22609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 226217ab2063SBarry Smith } 226317ab2063SBarry Smith 2264d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2265d71ae5a4SJacob Faibussowitsch { 22663a40ed3dSBarry Smith PetscFunctionBegin; 2267cb4a9cd9SHong Zhang if (nz) *nz = 0; 22682e5835c6SStefano Zampini if (idx) *idx = NULL; 22692e5835c6SStefano Zampini if (v) *v = NULL; 22703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 227117ab2063SBarry Smith } 227217ab2063SBarry Smith 2273d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2274d71ae5a4SJacob Faibussowitsch { 2275416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22762e5835c6SStefano Zampini const MatScalar *v; 227736db0b34SBarry Smith PetscReal sum = 0.0; 227897f1f81fSBarry Smith PetscInt i, j; 227917ab2063SBarry Smith 22803a40ed3dSBarry Smith PetscFunctionBegin; 22819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 228217ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2283570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2284570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2285792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2286570b7f6dSBarry Smith #else 2287416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22889371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22899371c9d4SSatish Balay v++; 229017ab2063SBarry Smith } 22918f1a2a5eSBarry Smith 
*nrm = PetscSqrtReal(sum); 2292570b7f6dSBarry Smith #endif 22939566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 22943a40ed3dSBarry Smith } else if (type == NORM_1) { 229536db0b34SBarry Smith PetscReal *tmp; 229697f1f81fSBarry Smith PetscInt *jj = a->j; 22979566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2298064f8208SBarry Smith *nrm = 0.0; 2299416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 23009371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 23019371c9d4SSatish Balay v++; 230217ab2063SBarry Smith } 2303d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2304064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 230517ab2063SBarry Smith } 23069566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23079566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 23083a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2309064f8208SBarry Smith *nrm = 0.0; 2310d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 23112e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 231217ab2063SBarry Smith sum = 0.0; 2313416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23149371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23159371c9d4SSatish Balay v2++; 231617ab2063SBarry Smith } 2317064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 231817ab2063SBarry Smith } 23199566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2320f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 232317ab2063SBarry Smith } 232417ab2063SBarry Smith 2325d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2326d71ae5a4SJacob Faibussowitsch { 23273d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ 
*)B->data; 232854f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 23292e5835c6SStefano Zampini const MatScalar *va, *vb; 233097f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2331cd0d46ebSvictorle 2332cd0d46ebSvictorle PetscFunctionBegin; 23339566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23349566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23355485867bSBarry Smith if (ma != nb || na != mb) { 23365485867bSBarry Smith *f = PETSC_FALSE; 23373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23385485867bSBarry Smith } 23399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23419371c9d4SSatish Balay aii = aij->i; 23429371c9d4SSatish Balay bii = bij->i; 23439371c9d4SSatish Balay adx = aij->j; 23449371c9d4SSatish Balay bdx = bij->j; 23459566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23469566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2347cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2348cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2349cd0d46ebSvictorle 2350cd0d46ebSvictorle *f = PETSC_TRUE; 2351cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2352cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 235397f1f81fSBarry Smith PetscInt idc, idr; 23545485867bSBarry Smith PetscScalar vc, vr; 2355cd0d46ebSvictorle /* column/row index/value */ 23565485867bSBarry Smith idc = adx[aptr[i]]; 23575485867bSBarry Smith idr = bdx[bptr[idc]]; 23585485867bSBarry Smith vc = va[aptr[i]]; 23595485867bSBarry Smith vr = vb[bptr[idc]]; 23605485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23615485867bSBarry Smith *f = PETSC_FALSE; 23625485867bSBarry Smith goto done; 2363cd0d46ebSvictorle } else { 23645485867bSBarry Smith aptr[i]++; 23655485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2366cd0d46ebSvictorle } 2367cd0d46ebSvictorle } 2368cd0d46ebSvictorle 
} 2369cd0d46ebSvictorle done: 23709566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23719566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 23743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2375cd0d46ebSvictorle } 2376cd0d46ebSvictorle 2377d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2378d71ae5a4SJacob Faibussowitsch { 23793d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 238054f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 238154f21887SBarry Smith MatScalar *va, *vb; 23821cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23831cbb95d3SBarry Smith 23841cbb95d3SBarry Smith PetscFunctionBegin; 23859566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23869566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23871cbb95d3SBarry Smith if (ma != nb || na != mb) { 23881cbb95d3SBarry Smith *f = PETSC_FALSE; 23893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23901cbb95d3SBarry Smith } 23919371c9d4SSatish Balay aii = aij->i; 23929371c9d4SSatish Balay bii = bij->i; 23939371c9d4SSatish Balay adx = aij->j; 23949371c9d4SSatish Balay bdx = bij->j; 23959371c9d4SSatish Balay va = aij->a; 23969371c9d4SSatish Balay vb = bij->a; 23979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23991cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 24001cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 24011cbb95d3SBarry Smith 24021cbb95d3SBarry Smith *f = PETSC_TRUE; 24031cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 24041cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 24051cbb95d3SBarry Smith PetscInt idc, idr; 
24061cbb95d3SBarry Smith PetscScalar vc, vr; 24071cbb95d3SBarry Smith /* column/row index/value */ 24081cbb95d3SBarry Smith idc = adx[aptr[i]]; 24091cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24101cbb95d3SBarry Smith vc = va[aptr[i]]; 24111cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24121cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24131cbb95d3SBarry Smith *f = PETSC_FALSE; 24141cbb95d3SBarry Smith goto done; 24151cbb95d3SBarry Smith } else { 24161cbb95d3SBarry Smith aptr[i]++; 24171cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24181cbb95d3SBarry Smith } 24191cbb95d3SBarry Smith } 24201cbb95d3SBarry Smith } 24211cbb95d3SBarry Smith done: 24229566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24239566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24251cbb95d3SBarry Smith } 24261cbb95d3SBarry Smith 2427d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2428d71ae5a4SJacob Faibussowitsch { 24299e29f15eSvictorle PetscFunctionBegin; 24309566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f)); 24313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24329e29f15eSvictorle } 24339e29f15eSvictorle 2434d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2435d71ae5a4SJacob Faibussowitsch { 24361cbb95d3SBarry Smith PetscFunctionBegin; 24379566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f)); 24383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24391cbb95d3SBarry Smith } 24401cbb95d3SBarry Smith 2441d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2442d71ae5a4SJacob Faibussowitsch { 2443416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2444fff8e43fSBarry Smith const PetscScalar *l, *r; 2445fff8e43fSBarry Smith PetscScalar x; 
244654f21887SBarry Smith MatScalar *v; 2447fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2448fff8e43fSBarry Smith const PetscInt *jj; 244917ab2063SBarry Smith 24503a40ed3dSBarry Smith PetscFunctionBegin; 245117ab2063SBarry Smith if (ll) { 24523ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24533ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24549566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 245508401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24569566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 245817ab2063SBarry Smith for (i = 0; i < m; i++) { 245917ab2063SBarry Smith x = l[i]; 2460416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24612205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 246217ab2063SBarry Smith } 24639566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24649566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 246617ab2063SBarry Smith } 246717ab2063SBarry Smith if (rr) { 24689566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 246908401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24709566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24722e5835c6SStefano Zampini jj = a->j; 24732205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24759566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24769566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 247717ab2063SBarry Smith } 24789566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 248017ab2063SBarry Smith } 248117ab2063SBarry Smith 2482d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2483d71ae5a4SJacob Faibussowitsch { 2484db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2485d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 248697f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24875d0c19d7SBarry Smith const PetscInt *irow, *icol; 24882e5835c6SStefano Zampini const PetscScalar *aa; 24895d0c19d7SBarry Smith PetscInt nrows, ncols; 249097f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 2491fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2492416022c9SBarry Smith Mat C; 2493cdc6f3adSToby Isaac PetscBool stride; 249417ab2063SBarry Smith 24953a40ed3dSBarry Smith PetscFunctionBegin; 24969566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24979566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24989566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 249917ab2063SBarry Smith 25009566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2501ff718158SBarry Smith if (stride) { 25029566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2503ff718158SBarry Smith } else { 2504ff718158SBarry Smith first = 0; 2505ff718158SBarry Smith step = 0; 2506ff718158SBarry Smith } 2507fee21e36SBarry Smith if (stride && step == 1) { 250802834360SBarry Smith /* special case of contiguous rows */ 25099566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 251002834360SBarry Smith /* loop over new rows determining lens and starting points */ 251102834360SBarry Smith 
for (i = 0; i < nrows; i++) { 2512bfeeae90SHong Zhang kstart = ai[irow[i]]; 2513a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2514a91a9bebSLisandro Dalcin starts[i] = kstart; 251502834360SBarry Smith for (k = kstart; k < kend; k++) { 2516bfeeae90SHong Zhang if (aj[k] >= first) { 251702834360SBarry Smith starts[i] = k; 251802834360SBarry Smith break; 251902834360SBarry Smith } 252002834360SBarry Smith } 2521a2744918SBarry Smith sum = 0; 252202834360SBarry Smith while (k < kend) { 2523bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2524a2744918SBarry Smith sum++; 252502834360SBarry Smith } 2526a2744918SBarry Smith lens[i] = sum; 252702834360SBarry Smith } 252802834360SBarry Smith /* create submatrix */ 2529cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 253097f1f81fSBarry Smith PetscInt n_cols, n_rows; 25319566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2532aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25339566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 253408480c60SBarry Smith C = *B; 25353a40ed3dSBarry Smith } else { 25363bef6203SJed Brown PetscInt rbs, cbs; 25379566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25389566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25399566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25409566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25419566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25429566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 254408480c60SBarry Smith } 2545db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2546db02288aSLois Curfman McInnes 254702834360SBarry Smith /* loop over rows 
inserting into submatrix */ 2548fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2549db02288aSLois Curfman McInnes j_new = c->j; 2550db02288aSLois Curfman McInnes i_new = c->i; 25519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 255202834360SBarry Smith for (i = 0; i < nrows; i++) { 2553a2744918SBarry Smith ii = starts[i]; 2554a2744918SBarry Smith lensi = lens[i]; 2555ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25569566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2557a2744918SBarry Smith a_new += lensi; 2558a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2559a2744918SBarry Smith c->ilen[i] = lensi; 256002834360SBarry Smith } 2561fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25639566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25643a40ed3dSBarry Smith } else { 25659566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25669566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25679566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25684dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25696bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25704dcab191SBarry Smith smap[icol[i]] = i + 1; 25714dcab191SBarry Smith } 25724dcab191SBarry Smith 257302834360SBarry Smith /* determine lens of each row */ 257402834360SBarry Smith for (i = 0; i < nrows; i++) { 2575bfeeae90SHong Zhang kstart = ai[irow[i]]; 257602834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 257702834360SBarry Smith lens[i] = 0; 
257802834360SBarry Smith for (k = kstart; k < kend; k++) { 2579ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 258002834360SBarry Smith } 258102834360SBarry Smith } 258217ab2063SBarry Smith /* Create and fill new matrix */ 2583a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2584ace3abfcSBarry Smith PetscBool equal; 25850f5bd95cSBarry Smith 258699141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2587aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25889566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 258928b400f6SJacob Faibussowitsch PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong no of nonzeros"); 25909566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 259108480c60SBarry Smith C = *B; 25923a40ed3dSBarry Smith } else { 25933bef6203SJed Brown PetscInt rbs, cbs; 25949566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25959566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25969566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25979566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25989566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25999566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 26009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 260108480c60SBarry Smith } 26029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2603fb3c7e2dSJunchao Zhang 260499141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 2605fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 260617ab2063SBarry Smith for (i = 0; i < nrows; i++) { 260799141d43SSatish Balay 
row = irow[i]; 2608bfeeae90SHong Zhang kstart = ai[row]; 260999141d43SSatish Balay kend = kstart + a->ilen[row]; 2610bfeeae90SHong Zhang mat_i = c->i[i]; 261199141d43SSatish Balay mat_j = c->j + mat_i; 2612fb3c7e2dSJunchao Zhang mat_a = c_a + mat_i; 261399141d43SSatish Balay mat_ilen = c->ilen + i; 261417ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2615bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2616ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26172e5835c6SStefano Zampini *mat_a++ = aa[k]; 261899141d43SSatish Balay (*mat_ilen)++; 261917ab2063SBarry Smith } 262017ab2063SBarry Smith } 262117ab2063SBarry Smith } 26229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 262302834360SBarry Smith /* Free work space */ 26249566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26259566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26269566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2627cdc6f3adSToby Isaac /* sort */ 2628cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2629cdc6f3adSToby Isaac PetscInt ilen; 2630cdc6f3adSToby Isaac 2631cdc6f3adSToby Isaac mat_i = c->i[i]; 2632cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2633fb3c7e2dSJunchao Zhang mat_a = c_a + mat_i; 2634cdc6f3adSToby Isaac ilen = c->ilen[i]; 26359566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2636cdc6f3adSToby Isaac } 2637fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 263802834360SBarry Smith } 26398c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26409566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2641305c6ccfSStefano Zampini #endif 26429566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26439566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 264417ab2063SBarry Smith 26459566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2646416022c9SBarry Smith *B = C; 
26473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 264817ab2063SBarry Smith } 264917ab2063SBarry Smith 2650d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2651d71ae5a4SJacob Faibussowitsch { 265282d44351SHong Zhang Mat B; 265382d44351SHong Zhang 265482d44351SHong Zhang PetscFunctionBegin; 2655c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26569566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26579566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26589566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26599566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26609566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 266182d44351SHong Zhang *subMat = B; 2662c2d650bdSHong Zhang } else { 26639566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2664c2d650bdSHong Zhang } 26653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 266682d44351SHong Zhang } 266782d44351SHong Zhang 2668d71ae5a4SJacob Faibussowitsch PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2669d71ae5a4SJacob Faibussowitsch { 267063b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 267163b91edcSBarry Smith Mat outA; 2672ace3abfcSBarry Smith PetscBool row_identity, col_identity; 267363b91edcSBarry Smith 26743a40ed3dSBarry Smith PetscFunctionBegin; 267508401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26761df811f5SHong Zhang 26779566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26789566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2679a871dcd8SBarry Smith 268063b91edcSBarry Smith outA = inA; 2681d5f3da31SBarry 
Smith outA->factortype = MAT_FACTOR_LU; 26829566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26839566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26842205254eSKarl Rupp 26859566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26869566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26872205254eSKarl Rupp 2688c3122656SLisandro Dalcin a->row = row; 26892205254eSKarl Rupp 26909566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26919566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26922205254eSKarl Rupp 2693c3122656SLisandro Dalcin a->col = col; 269463b91edcSBarry Smith 269536db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26969566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26979566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2698f0ec6fceSSatish Balay 269994a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 27009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 270194a9d846SBarry Smith } 270263b91edcSBarry Smith 27039566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2704137fb511SHong Zhang if (row_identity && col_identity) { 27059566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2706137fb511SHong Zhang } else { 27079566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2708137fb511SHong Zhang } 27093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2710a871dcd8SBarry Smith } 2711a871dcd8SBarry Smith 2712d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2713d71ae5a4SJacob Faibussowitsch { 2714f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2715dfa0f9e5SStefano Zampini 
PetscScalar *v; 2716c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 27173a40ed3dSBarry Smith 27183a40ed3dSBarry Smith PetscFunctionBegin; 27199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27209566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2721792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27229566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2726f0b747eeSBarry Smith } 2727f0b747eeSBarry Smith 2728d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2729d71ae5a4SJacob Faibussowitsch { 273016b64355SHong Zhang PetscInt i; 273116b64355SHong Zhang 273216b64355SHong Zhang PetscFunctionBegin; 273316b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27349566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 273516b64355SHong Zhang 273648a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27379566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 273816b64355SHong Zhang 273916b64355SHong Zhang if (submatj->rbuf1) { 27409566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27419566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 274216b64355SHong Zhang } 274316b64355SHong Zhang 274448a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27459566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27469566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 274716b64355SHong Zhang } 
274816b64355SHong Zhang 274916b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2750eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27519566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27529566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 275316b64355SHong Zhang #else 27549566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 275516b64355SHong Zhang #endif 275616b64355SHong Zhang 275716b64355SHong Zhang if (!submatj->allcolumns) { 275816b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2759eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap)); 276016b64355SHong Zhang #else 27619566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 276216b64355SHong Zhang #endif 276316b64355SHong Zhang } 27649566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 276516b64355SHong Zhang 27669566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 27673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 276816b64355SHong Zhang } 276916b64355SHong Zhang 2770d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2771d71ae5a4SJacob Faibussowitsch { 277216b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27735c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 277416b64355SHong Zhang 277516b64355SHong Zhang PetscFunctionBegin; 27769566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27779566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 277916b64355SHong Zhang } 278016b64355SHong Zhang 278189a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2782d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2783d71ae5a4SJacob Faibussowitsch { 27842d033e1fSHong Zhang PetscInt i; 
27850fb991dcSHong Zhang Mat C; 27860fb991dcSHong Zhang Mat_SeqAIJ *c; 27870fb991dcSHong Zhang Mat_SubSppt *submatj; 27882d033e1fSHong Zhang 27892d033e1fSHong Zhang PetscFunctionBegin; 27902d033e1fSHong Zhang for (i = 0; i < n; i++) { 27910fb991dcSHong Zhang C = (*mat)[i]; 27920fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27930fb991dcSHong Zhang submatj = c->submatis1; 27942d033e1fSHong Zhang if (submatj) { 2795682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 279626cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27979566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27989566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27999566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 28003faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 28019566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 28029566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 28039566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2804682e4c99SStefano Zampini } 28052d033e1fSHong Zhang } else { 28069566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 28072d033e1fSHong Zhang } 28082d033e1fSHong Zhang } 280986e85357SHong Zhang 281063a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 28119566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 281263a75b2aSHong Zhang 28139566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28152d033e1fSHong Zhang } 28162d033e1fSHong Zhang 2817d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2818d71ae5a4SJacob Faibussowitsch { 281997f1f81fSBarry Smith PetscInt i; 2820cddf8d76SBarry Smith 28213a40ed3dSBarry Smith PetscFunctionBegin; 282248a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) 
PetscCall(PetscCalloc1(n + 1, B)); 2823cddf8d76SBarry Smith 282448a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2826cddf8d76SBarry Smith } 2827cddf8d76SBarry Smith 2828d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2829d71ae5a4SJacob Faibussowitsch { 2830e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28319a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, isz, val; 28325d0c19d7SBarry Smith const PetscInt *idx; 28339a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1; 2834f1af5d2fSBarry Smith PetscBT table; 2835bbd702dbSSatish Balay 28363a40ed3dSBarry Smith PetscFunctionBegin; 28379a88ca10SBarry Smith m = A->rmap->n / bs; 2838e4d965acSSatish Balay ai = a->i; 2839bfeeae90SHong Zhang aj = a->j; 28408a047759SSatish Balay 284108401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 284206763907SSatish Balay 28439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28449566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 284506763907SSatish Balay 2846e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2847b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2848e4d965acSSatish Balay isz = 0; 28499566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2850e4d965acSSatish Balay 2851e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28529566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28539566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2854e4d965acSSatish Balay 28559a88ca10SBarry Smith if (bs > 1) { 28569a88ca10SBarry Smith /* Enter these into the temp 
arrays. I.e., mark table[row], enter row into new index */ 28579a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28589a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28599a88ca10SBarry Smith } 28609a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28619a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28629a88ca10SBarry Smith 28639a88ca10SBarry Smith k = 0; 28649a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28659a88ca10SBarry Smith n = isz; 28669a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28679a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28689a88ca10SBarry Smith row = bs * nidx[k] + ll; 28699a88ca10SBarry Smith start = ai[row]; 28709a88ca10SBarry Smith end = ai[row + 1]; 28719a88ca10SBarry Smith for (l = start; l < end; l++) { 28729a88ca10SBarry Smith val = aj[l] / bs; 28739a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28749a88ca10SBarry Smith } 28759a88ca10SBarry Smith } 28769a88ca10SBarry Smith } 28779a88ca10SBarry Smith } 28789a88ca10SBarry Smith PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i))); 28799a88ca10SBarry Smith } else { 2880dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2881e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28822205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28834dcbc457SBarry Smith } 28849566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28859566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2886e4d965acSSatish Balay 288704a348a9SBarry Smith k = 0; 288804a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 288904a348a9SBarry Smith n = isz; 289006763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2891e4d965acSSatish Balay row = nidx[k]; 2892e4d965acSSatish Balay start = ai[row]; 2893e4d965acSSatish Balay end = ai[row + 1]; 289404a348a9SBarry Smith for (l = start; l < end; l++) { 2895efb16452SHong Zhang val = aj[l]; 28962205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2897e4d965acSSatish Balay } 2898e4d965acSSatish Balay } 2899e4d965acSSatish Balay } 29009566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2901e4d965acSSatish Balay } 29029a88ca10SBarry Smith } 29039566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 29049566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 29053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29064dcbc457SBarry Smith } 290717ab2063SBarry Smith 29080513a670SBarry Smith /* -------------------------------------------------------------- */ 2909d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2910d71ae5a4SJacob Faibussowitsch { 29110513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29123b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 29135d0c19d7SBarry Smith const PetscInt *row, *col; 29145d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 291556cd22aeSBarry Smith IS icolp, irowp; 29160298fd71SBarry Smith PetscInt *cwork = 
NULL; 29170298fd71SBarry Smith PetscScalar *vwork = NULL; 29180513a670SBarry Smith 29193a40ed3dSBarry Smith PetscFunctionBegin; 29209566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29219566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29229566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29239566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29240513a670SBarry Smith 29250513a670SBarry Smith /* determine lengths of permuted rows */ 29269566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29272205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29289566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29299566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29309566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29319566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29339566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29340513a670SBarry Smith 29359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29360513a670SBarry Smith for (i = 0; i < m; i++) { 29379566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29382205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29399566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29409566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29410513a670SBarry Smith } 29429566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29432205254eSKarl Rupp 29443c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29452205254eSKarl Rupp 29468c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29479566063dSJacob Faibussowitsch 
PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29489fe5e383SStefano Zampini #endif 29499566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29509566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29519566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29529566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29539566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29549566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 295548a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29570513a670SBarry Smith } 29580513a670SBarry Smith 2959d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2960d71ae5a4SJacob Faibussowitsch { 2961cb5b572fSBarry Smith PetscFunctionBegin; 296233f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. 
*/ 296333f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2964be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2965be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29662e5835c6SStefano Zampini const PetscScalar *aa; 2967be6bf707SBarry Smith 29689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 296908401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29709566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29719566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2973cb5b572fSBarry Smith } else { 29749566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2975cb5b572fSBarry Smith } 29763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2977cb5b572fSBarry Smith } 2978cb5b572fSBarry Smith 2979d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2980d71ae5a4SJacob Faibussowitsch { 29816c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29826e111a19SKarl Rupp 29836c0721eeSBarry Smith PetscFunctionBegin; 29846c0721eeSBarry Smith *array = a->a; 29853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29866c0721eeSBarry Smith } 29876c0721eeSBarry Smith 2988d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[]) 2989d71ae5a4SJacob Faibussowitsch { 29906c0721eeSBarry Smith PetscFunctionBegin; 2991f38c1e66SStefano Zampini *array = NULL; 29923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29936c0721eeSBarry Smith } 2994273d9f13SBarry Smith 29958229c054SShri Abhyankar /* 29968229c054SShri 
Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29978229c054SShri Abhyankar have different nonzero structure. 29988229c054SShri Abhyankar */ 2999d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 3000d71ae5a4SJacob Faibussowitsch { 3001b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 3002ec7775f6SShri Abhyankar 3003ec7775f6SShri Abhyankar PetscFunctionBegin; 3004ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 3005ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 3006b264fe52SHong Zhang const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i]; 3007b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 3008b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 30098af7cee1SJed Brown nnz[i] = 0; 30108af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 3011b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3012b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 30138af7cee1SJed Brown nnz[i]++; 30148af7cee1SJed Brown } 30158af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 3016ec7775f6SShri Abhyankar } 30173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3018ec7775f6SShri Abhyankar } 3019ec7775f6SShri Abhyankar 3020d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3021d71ae5a4SJacob Faibussowitsch { 3022b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3023b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3024b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data; 3025b264fe52SHong Zhang 3026b264fe52SHong Zhang PetscFunctionBegin; 3027b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30289566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 30293ba16761SJacob 
Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3030b264fe52SHong Zhang } 3031b264fe52SHong Zhang 3032d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3033d71ae5a4SJacob Faibussowitsch { 3034ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3035ac90fabeSBarry Smith 3036ac90fabeSBarry Smith PetscFunctionBegin; 3037134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3038134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3039134adf20SPierre Jolivet if (e) { 30409566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 304181fa06acSBarry Smith if (e) { 30429566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3043134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 304481fa06acSBarry Smith } 304581fa06acSBarry Smith } 304654c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 304781fa06acSBarry Smith } 3048ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30492e5835c6SStefano Zampini const PetscScalar *xa; 30502e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 305181fa06acSBarry Smith PetscBLASInt one = 1, bnz; 305281fa06acSBarry Smith 30539566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3056792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 30579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30599566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30609566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30619566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3062ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30639566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3064ac90fabeSBarry Smith } else { 30658229c054SShri Abhyankar Mat B; 30668229c054SShri Abhyankar PetscInt *nnz; 30679566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30689566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30699566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30709566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30719566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30729566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30749566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30759566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30769bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30779566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3078ac90fabeSBarry Smith } 30793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3080ac90fabeSBarry Smith } 3081ac90fabeSBarry Smith 3082d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3083d71ae5a4SJacob Faibussowitsch { 3084354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3085354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3086354c94deSBarry Smith PetscInt i, nz; 3087354c94deSBarry Smith PetscScalar *a; 3088354c94deSBarry Smith 3089354c94deSBarry Smith PetscFunctionBegin; 3090354c94deSBarry Smith nz = aij->nz; 30919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, 
&a)); 30922205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 30939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3094354c94deSBarry Smith #else 3095354c94deSBarry Smith PetscFunctionBegin; 3096354c94deSBarry Smith #endif 30973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3098354c94deSBarry Smith } 3099354c94deSBarry Smith 3100d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3101d71ae5a4SJacob Faibussowitsch { 3102e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3103d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3104e34fafa9SBarry Smith PetscReal atmp; 3105985db425SBarry Smith PetscScalar *x; 3106ce496241SStefano Zampini const MatScalar *aa, *av; 3107e34fafa9SBarry Smith 3108e34fafa9SBarry Smith PetscFunctionBegin; 310928b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3111ce496241SStefano Zampini aa = av; 3112e34fafa9SBarry Smith ai = a->i; 3113e34fafa9SBarry Smith aj = a->j; 3114e34fafa9SBarry Smith 31159566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31169566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31179566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 311808401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3119e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31209371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31219371c9d4SSatish Balay ai++; 3122e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3123985db425SBarry Smith atmp = PetscAbsScalar(*aa); 31249371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31259371c9d4SSatish Balay x[i] = atmp; 31269371c9d4SSatish Balay if (idx) idx[i] = *aj; 31279371c9d4SSatish Balay } 31289371c9d4SSatish Balay aa++; 
31299371c9d4SSatish Balay aj++; 3130985db425SBarry Smith } 3131985db425SBarry Smith } 31329566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3135985db425SBarry Smith } 3136985db425SBarry Smith 3137d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3138d71ae5a4SJacob Faibussowitsch { 3139985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3140d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3141985db425SBarry Smith PetscScalar *x; 3142ce496241SStefano Zampini const MatScalar *aa, *av; 3143985db425SBarry Smith 3144985db425SBarry Smith PetscFunctionBegin; 314528b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3147ce496241SStefano Zampini aa = av; 3148985db425SBarry Smith ai = a->i; 3149985db425SBarry Smith aj = a->j; 3150985db425SBarry Smith 31519566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31529566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31539566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 315408401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3155985db425SBarry Smith for (i = 0; i < m; i++) { 31569371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31579371c9d4SSatish Balay ai++; 3158d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31599371c9d4SSatish Balay x[i] = *aa; 31609371c9d4SSatish Balay if (idx) idx[i] = 0; 3161985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3162985db425SBarry Smith x[i] = 0.0; 3163985db425SBarry Smith if (idx) { 3164985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first 
implicit 0.0 in the row */ 3165985db425SBarry Smith if (aj[j] > j) { 3166985db425SBarry Smith idx[i] = j; 3167985db425SBarry Smith break; 3168985db425SBarry Smith } 3169985db425SBarry Smith } 31701a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31711a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3172985db425SBarry Smith } 3173985db425SBarry Smith } 3174985db425SBarry Smith for (j = 0; j < ncols; j++) { 31759371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31769371c9d4SSatish Balay x[i] = *aa; 31779371c9d4SSatish Balay if (idx) idx[i] = *aj; 31789371c9d4SSatish Balay } 31799371c9d4SSatish Balay aa++; 31809371c9d4SSatish Balay aj++; 3181985db425SBarry Smith } 3182985db425SBarry Smith } 31839566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3186985db425SBarry Smith } 3187985db425SBarry Smith 3188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3189d71ae5a4SJacob Faibussowitsch { 3190c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3191c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3192ce496241SStefano Zampini PetscScalar *x; 3193ce496241SStefano Zampini const MatScalar *aa, *av; 3194c87e5d42SMatthew Knepley 3195c87e5d42SMatthew Knepley PetscFunctionBegin; 31969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3197ce496241SStefano Zampini aa = av; 3198c87e5d42SMatthew Knepley ai = a->i; 3199c87e5d42SMatthew Knepley aj = a->j; 3200c87e5d42SMatthew Knepley 32019566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32029566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32039566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 320408401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, 
PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3205c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32069371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32079371c9d4SSatish Balay ai++; 3208f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32099371c9d4SSatish Balay x[i] = *aa; 32109371c9d4SSatish Balay if (idx) idx[i] = 0; 3211f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3212f07e67edSHong Zhang x[i] = 0.0; 3213f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3214289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3215f07e67edSHong Zhang if (aj[j] > j) { 3216f07e67edSHong Zhang idx[i] = j; 32172205254eSKarl Rupp break; 32182205254eSKarl Rupp } 3219289a08f5SMatthew Knepley } 3220f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3221f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3222f07e67edSHong Zhang } 3223289a08f5SMatthew Knepley } 3224c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32259371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32269371c9d4SSatish Balay x[i] = *aa; 32279371c9d4SSatish Balay if (idx) idx[i] = *aj; 32289371c9d4SSatish Balay } 32299371c9d4SSatish Balay aa++; 32309371c9d4SSatish Balay aj++; 3231c87e5d42SMatthew Knepley } 3232c87e5d42SMatthew Knepley } 32339566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3236c87e5d42SMatthew Knepley } 3237c87e5d42SMatthew Knepley 3238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3239d71ae5a4SJacob Faibussowitsch { 3240985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3241d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3242d9ca1df4SBarry Smith 
const PetscInt *ai, *aj; 3243985db425SBarry Smith PetscScalar *x; 3244ce496241SStefano Zampini const MatScalar *aa, *av; 3245985db425SBarry Smith 3246985db425SBarry Smith PetscFunctionBegin; 324728b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3249ce496241SStefano Zampini aa = av; 3250985db425SBarry Smith ai = a->i; 3251985db425SBarry Smith aj = a->j; 3252985db425SBarry Smith 32539566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32549566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32559566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 325608401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3257985db425SBarry Smith for (i = 0; i < m; i++) { 32589371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32599371c9d4SSatish Balay ai++; 3260d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32619371c9d4SSatish Balay x[i] = *aa; 32629371c9d4SSatish Balay if (idx) idx[i] = 0; 3263985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3264985db425SBarry Smith x[i] = 0.0; 3265985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3266985db425SBarry Smith for (j = 0; j < ncols; j++) { 3267985db425SBarry Smith if (aj[j] > j) { 3268985db425SBarry Smith idx[i] = j; 3269985db425SBarry Smith break; 3270985db425SBarry Smith } 3271985db425SBarry Smith } 3272fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3273fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3274985db425SBarry Smith } 3275985db425SBarry Smith } 3276985db425SBarry Smith for (j = 0; j < ncols; j++) { 32779371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32789371c9d4SSatish Balay x[i] = *aa; 32799371c9d4SSatish Balay if (idx) idx[i] = 
*aj; 32809371c9d4SSatish Balay } 32819371c9d4SSatish Balay aa++; 32829371c9d4SSatish Balay aj++; 3283e34fafa9SBarry Smith } 3284e34fafa9SBarry Smith } 32859566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3288e34fafa9SBarry Smith } 3289bbead8a2SBarry Smith 3290d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3291d71ae5a4SJacob Faibussowitsch { 3292bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 329333d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3294bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 32950da83c2eSBarry Smith const PetscReal shift = 0.0; 32961a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3297bbead8a2SBarry Smith 3298bbead8a2SBarry Smith PetscFunctionBegin; 3299a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33004a0d0026SBarry Smith if (a->ibdiagvalid) { 33014a0d0026SBarry Smith if (values) *values = a->ibdiag; 33023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 33034a0d0026SBarry Smith } 33049566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 33054dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3306bbead8a2SBarry Smith diag = a->ibdiag; 3307bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3308bbead8a2SBarry Smith /* factor and invert each block */ 3309bbead8a2SBarry Smith switch (bs) { 3310bbead8a2SBarry Smith case 1: 3311bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33129566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 3313ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3314ec1892c8SHong Zhang if (allowzeropivot) { 
33157b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33167b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33177b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33189566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 331998921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3320ec1892c8SHong Zhang } 3321bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3322bbead8a2SBarry Smith } 3323bbead8a2SBarry Smith break; 3324bbead8a2SBarry Smith case 2: 3325bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33269371c9d4SSatish Balay ij[0] = 2 * i; 33279371c9d4SSatish Balay ij[1] = 2 * i + 1; 33289566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33299566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33307b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33319566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3332bbead8a2SBarry Smith diag += 4; 3333bbead8a2SBarry Smith } 3334bbead8a2SBarry Smith break; 3335bbead8a2SBarry Smith case 3: 3336bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33379371c9d4SSatish Balay ij[0] = 3 * i; 33389371c9d4SSatish Balay ij[1] = 3 * i + 1; 33399371c9d4SSatish Balay ij[2] = 3 * i + 2; 33409566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 33427b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33439566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3344bbead8a2SBarry Smith diag += 9; 3345bbead8a2SBarry Smith } 3346bbead8a2SBarry Smith break; 3347bbead8a2SBarry Smith case 4: 3348bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33499371c9d4SSatish Balay ij[0] = 4 * i; 33509371c9d4SSatish Balay ij[1] = 4 * i + 1; 33519371c9d4SSatish Balay ij[2] = 4 * i + 2; 33529371c9d4SSatish Balay ij[3] = 4 * i + 3; 33539566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33549566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33557b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33569566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3357bbead8a2SBarry Smith diag += 16; 3358bbead8a2SBarry Smith } 3359bbead8a2SBarry Smith break; 3360bbead8a2SBarry Smith case 5: 3361bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33629371c9d4SSatish Balay ij[0] = 5 * i; 33639371c9d4SSatish Balay ij[1] = 5 * i + 1; 33649371c9d4SSatish Balay ij[2] = 5 * i + 2; 33659371c9d4SSatish Balay ij[3] = 5 * i + 3; 33669371c9d4SSatish Balay ij[4] = 5 * i + 4; 33679566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33689566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33697b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33709566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3371bbead8a2SBarry Smith diag += 25; 3372bbead8a2SBarry Smith } 3373bbead8a2SBarry Smith break; 3374bbead8a2SBarry Smith case 6: 3375bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33769371c9d4SSatish Balay ij[0] = 6 * i; 33779371c9d4SSatish Balay ij[1] = 6 * i + 1; 33789371c9d4SSatish Balay ij[2] = 6 * i + 2; 33799371c9d4SSatish Balay ij[3] = 6 * i + 3; 33809371c9d4SSatish Balay ij[4] = 
6 * i + 4; 33819371c9d4SSatish Balay ij[5] = 6 * i + 5; 33829566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33839566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33847b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33859566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3386bbead8a2SBarry Smith diag += 36; 3387bbead8a2SBarry Smith } 3388bbead8a2SBarry Smith break; 3389bbead8a2SBarry Smith case 7: 3390bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33919371c9d4SSatish Balay ij[0] = 7 * i; 33929371c9d4SSatish Balay ij[1] = 7 * i + 1; 33939371c9d4SSatish Balay ij[2] = 7 * i + 2; 33949371c9d4SSatish Balay ij[3] = 7 * i + 3; 33959371c9d4SSatish Balay ij[4] = 7 * i + 4; 33969371c9d4SSatish Balay ij[5] = 7 * i + 5; 3397cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 33989566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 33999566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 34007b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34019566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3402bbead8a2SBarry Smith diag += 49; 3403bbead8a2SBarry Smith } 3404bbead8a2SBarry Smith break; 3405bbead8a2SBarry Smith default: 34069566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3407bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3408ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34099566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34109566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 34117b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 34129566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3413bbead8a2SBarry Smith diag += bs2; 3414bbead8a2SBarry Smith } 34159566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3416bbead8a2SBarry Smith } 3417bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 34183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3419bbead8a2SBarry Smith } 3420bbead8a2SBarry Smith 3421d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3422d71ae5a4SJacob Faibussowitsch { 342373a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3424fff043a9SJunchao Zhang PetscScalar a, *aa; 342573a71a0fSBarry Smith PetscInt m, n, i, j, col; 342673a71a0fSBarry Smith 342773a71a0fSBarry Smith PetscFunctionBegin; 342873a71a0fSBarry Smith if (!x->assembled) { 34299566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 343073a71a0fSBarry Smith for (i = 0; i < m; i++) { 343173a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34329566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 343373a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34349566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 343573a71a0fSBarry Smith } 343673a71a0fSBarry Smith } 3437e2ce353bSJunchao Zhang } else { 34389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34399566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3441e2ce353bSJunchao Zhang } 34429566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34439566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 344573a71a0fSBarry Smith } 344673a71a0fSBarry Smith 3447679944adSJunchao 
Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3448d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3449d71ae5a4SJacob Faibussowitsch { 3450679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3451679944adSJunchao Zhang PetscScalar a; 3452679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3453679944adSJunchao Zhang 3454679944adSJunchao Zhang PetscFunctionBegin; 3455679944adSJunchao Zhang nskip = high - low; 34569566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3457679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3458679944adSJunchao Zhang for (i = 0; i < m; i++) { 3459679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34609566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3461679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3462679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34639566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3464679944adSJunchao Zhang } 3465e2ce353bSJunchao Zhang } 34669566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34679566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3469679944adSJunchao Zhang } 3470679944adSJunchao Zhang 3471682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 34720a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3473cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3474cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3475cb5b572fSBarry Smith MatMult_SeqAIJ, 347697304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34777c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34787c922b88SBarry Smith 
MatMultTransposeAdd_SeqAIJ, 3479f4259b30SLisandro Dalcin NULL, 3480f4259b30SLisandro Dalcin NULL, 3481f4259b30SLisandro Dalcin NULL, 3482f4259b30SLisandro Dalcin /* 10*/ NULL, 3483cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3484f4259b30SLisandro Dalcin NULL, 348541f059aeSBarry Smith MatSOR_SeqAIJ, 348691e9d3e2SHong Zhang MatTranspose_SeqAIJ, 348797304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3488cb5b572fSBarry Smith MatEqual_SeqAIJ, 3489cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3490cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3491cb5b572fSBarry Smith MatNorm_SeqAIJ, 3492f4259b30SLisandro Dalcin /* 20*/ NULL, 3493cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3494cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3495cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3496d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3497f4259b30SLisandro Dalcin NULL, 3498f4259b30SLisandro Dalcin NULL, 3499f4259b30SLisandro Dalcin NULL, 3500f4259b30SLisandro Dalcin NULL, 350126cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 3502f4259b30SLisandro Dalcin NULL, 3503f4259b30SLisandro Dalcin NULL, 3504f4259b30SLisandro Dalcin NULL, 3505f4259b30SLisandro Dalcin NULL, 3506d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3507f4259b30SLisandro Dalcin NULL, 3508f4259b30SLisandro Dalcin NULL, 3509cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3510f4259b30SLisandro Dalcin NULL, 3511d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35127dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3513cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3514cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3515cb5b572fSBarry Smith MatCopy_SeqAIJ, 3516d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3517cb5b572fSBarry Smith MatScale_SeqAIJ, 35187d68702bSBarry Smith MatShift_SeqAIJ, 351979299369SBarry Smith MatDiagonalSet_SeqAIJ, 35206e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 352173a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35223b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35233b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 
35243b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3525a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 352693dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3527f4259b30SLisandro Dalcin NULL, 3528f4259b30SLisandro Dalcin NULL, 3529cda55fadSBarry Smith MatPermute_SeqAIJ, 3530f4259b30SLisandro Dalcin NULL, 3531f4259b30SLisandro Dalcin /* 59*/ NULL, 3532b9b97703SBarry Smith MatDestroy_SeqAIJ, 3533b9b97703SBarry Smith MatView_SeqAIJ, 3534f4259b30SLisandro Dalcin NULL, 3535f4259b30SLisandro Dalcin NULL, 3536f4259b30SLisandro Dalcin /* 64*/ NULL, 3537321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3538f4259b30SLisandro Dalcin NULL, 3539f4259b30SLisandro Dalcin NULL, 3540f4259b30SLisandro Dalcin NULL, 3541d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3542c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3543f4259b30SLisandro Dalcin NULL, 3544f4259b30SLisandro Dalcin NULL, 3545f4259b30SLisandro Dalcin NULL, 3546f4259b30SLisandro Dalcin /* 74*/ NULL, 35473acb8795SBarry Smith MatFDColoringApply_AIJ, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin NULL, 3550f4259b30SLisandro Dalcin NULL, 35516ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3552f4259b30SLisandro Dalcin NULL, 3553f4259b30SLisandro Dalcin NULL, 3554f4259b30SLisandro Dalcin NULL, 3555bc011b1eSHong Zhang MatLoad_SeqAIJ, 3556d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35571cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3558f4259b30SLisandro Dalcin NULL, 3559f4259b30SLisandro Dalcin NULL, 3560f4259b30SLisandro Dalcin NULL, 3561f4259b30SLisandro Dalcin /* 89*/ NULL, 3562f4259b30SLisandro Dalcin NULL, 356326be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3564f4259b30SLisandro Dalcin NULL, 3565f4259b30SLisandro Dalcin NULL, 35668fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3567f4259b30SLisandro Dalcin NULL, 3568f4259b30SLisandro Dalcin NULL, 35696fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3570f4259b30SLisandro 
Dalcin NULL, 35714222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3572f4259b30SLisandro Dalcin NULL, 3573f4259b30SLisandro Dalcin NULL, 357487d4246cSBarry Smith MatConjugate_SeqAIJ, 3575f4259b30SLisandro Dalcin NULL, 3576d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 357799cafbc1SBarry Smith MatRealPart_SeqAIJ, 3578f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3579f4259b30SLisandro Dalcin NULL, 3580f4259b30SLisandro Dalcin NULL, 3581cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3582f4259b30SLisandro Dalcin NULL, 35832af78befSBarry Smith MatGetRowMin_SeqAIJ, 3584f4259b30SLisandro Dalcin NULL, 3585599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3586f4259b30SLisandro Dalcin /*114*/ NULL, 3587f4259b30SLisandro Dalcin NULL, 3588f4259b30SLisandro Dalcin NULL, 3589f4259b30SLisandro Dalcin NULL, 3590f4259b30SLisandro Dalcin NULL, 3591f4259b30SLisandro Dalcin /*119*/ NULL, 3592f4259b30SLisandro Dalcin NULL, 3593f4259b30SLisandro Dalcin NULL, 3594f4259b30SLisandro Dalcin NULL, 3595b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 35960716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3597a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 359837868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 35990da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3600f4259b30SLisandro Dalcin NULL, 3601f4259b30SLisandro Dalcin /*129*/ NULL, 3602f4259b30SLisandro Dalcin NULL, 3603f4259b30SLisandro Dalcin NULL, 360475648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3605b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3606b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36072b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3608f4259b30SLisandro Dalcin NULL, 3609f4259b30SLisandro Dalcin NULL, 36103964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3611f4259b30SLisandro Dalcin /*139*/ NULL, 3612f4259b30SLisandro Dalcin NULL, 3613f4259b30SLisandro Dalcin NULL, 36143a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 
36159c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36164222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36174222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3618f4259b30SLisandro Dalcin NULL, 361972833a62Smarkadams4 NULL, 362072833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36212d776b49SBarry Smith NULL, 3622dec0b466SHong Zhang /*150*/ MatTransposeSymbolic_SeqAIJ, 3623dec0b466SHong Zhang MatEliminateZeros_SeqAIJ}; 362417ab2063SBarry Smith 3625d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3626d71ae5a4SJacob Faibussowitsch { 3627bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 362897f1f81fSBarry Smith PetscInt i, nz, n; 3629bef8e0ddSBarry Smith 3630bef8e0ddSBarry Smith PetscFunctionBegin; 3631bef8e0ddSBarry Smith nz = aij->maxnz; 3632d0f46423SBarry Smith n = mat->rmap->n; 3633ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3634bef8e0ddSBarry Smith aij->nz = nz; 3635ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 36363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3637bef8e0ddSBarry Smith } 3638bef8e0ddSBarry Smith 3639a3bb6f32SFande Kong /* 3640ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3641ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3642ddea5d60SJunchao Zhang */ 3643d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3644d71ae5a4SJacob Faibussowitsch { 3645a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3646eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3647eec179cfSJacob Faibussowitsch PetscHashIter tpos; 364825b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 364925b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3650a3bb6f32SFande Kong 3651a3bb6f32SFande Kong PetscFunctionBegin; 3652a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3653a3bb6f32SFande Kong PetscValidPointer(mapping, 2); 3654a3bb6f32SFande Kong /* use a table */ 3655eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3656a3bb6f32SFande Kong ec = 0; 365725b670f0SStefano Zampini for (i = 0; i < nz; i++) { 365825b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3659eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3660a3bb6f32SFande Kong if (!data) { 3661a3bb6f32SFande Kong /* one based table */ 3662c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3663a3bb6f32SFande Kong } 3664a3bb6f32SFande Kong } 3665a3bb6f32SFande Kong /* form array of columns we need */ 36669566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3667eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3668eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3669eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3670eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3671eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3672a3bb6f32SFande Kong gid--; 3673a3bb6f32SFande 
Kong lid--; 3674a3bb6f32SFande Kong garray[lid] = gid; 3675a3bb6f32SFande Kong } 36769566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3677eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3678c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3679a3bb6f32SFande Kong /* compact out the extra columns in B */ 368025b670f0SStefano Zampini for (i = 0; i < nz; i++) { 368125b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3682eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3683a3bb6f32SFande Kong lid--; 368425b670f0SStefano Zampini jj[i] = lid; 3685a3bb6f32SFande Kong } 36869566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3687eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 36889566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36899566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36909566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 36913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3692a3bb6f32SFande Kong } 3693a3bb6f32SFande Kong 3694bef8e0ddSBarry Smith /*@ 3695bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3696bef8e0ddSBarry Smith in the matrix. 
3697bef8e0ddSBarry Smith 3698bef8e0ddSBarry Smith Input Parameters: 369911a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3700bef8e0ddSBarry Smith - indices - the column indices 3701bef8e0ddSBarry Smith 370215091d37SBarry Smith Level: advanced 370315091d37SBarry Smith 3704bef8e0ddSBarry Smith Notes: 3705bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3706bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 370711a5261eSBarry Smith of the `MatSetValues()` operation. 3708bef8e0ddSBarry Smith 3709bef8e0ddSBarry Smith You MUST have set the correct number of nonzeros per row in the call to 371011a5261eSBarry Smith `MatCreateSeqAIJ()`, and the column indices MUST be sorted. 3711bef8e0ddSBarry Smith 371211a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3713bef8e0ddSBarry Smith 3714b9617806SBarry Smith The indices should start with zero, not one. 3715b9617806SBarry Smith 3716bef8e0ddSBarry Smith @*/ 3717d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3718d71ae5a4SJacob Faibussowitsch { 3719bef8e0ddSBarry Smith PetscFunctionBegin; 37200700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3721dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 3722cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 37233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3724bef8e0ddSBarry Smith } 3725bef8e0ddSBarry Smith 3726be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3727be6bf707SBarry Smith 3728d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3729d71ae5a4SJacob Faibussowitsch { 3730be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3731d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3732be6bf707SBarry Smith 
3733be6bf707SBarry Smith PetscFunctionBegin; 373428b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3735be6bf707SBarry Smith 3736be6bf707SBarry Smith /* allocate space for values if not already there */ 37374dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3738be6bf707SBarry Smith 3739be6bf707SBarry Smith /* copy values over */ 37409566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 37413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3742be6bf707SBarry Smith } 3743be6bf707SBarry Smith 3744be6bf707SBarry Smith /*@ 3745be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3746be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3747be6bf707SBarry Smith nonlinear portion. 3748be6bf707SBarry Smith 3749c3339decSBarry Smith Logically Collective 3750be6bf707SBarry Smith 3751*27430b45SBarry Smith Input Parameter: 375211a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3753be6bf707SBarry Smith 375415091d37SBarry Smith Level: advanced 375515091d37SBarry Smith 3756*27430b45SBarry Smith Usage: 3757*27430b45SBarry Smith .vb 3758*27430b45SBarry Smith Using `SNES` 3759*27430b45SBarry Smith Create Jacobian matrix 3760*27430b45SBarry Smith Set linear terms into matrix 3761*27430b45SBarry Smith Apply boundary conditions to matrix, at this time matrix must have 3762*27430b45SBarry Smith final nonzero structure (i.e. 
setting the nonlinear terms and applying 3763*27430b45SBarry Smith boundary conditions again will not change the nonzero structure) 3764*27430b45SBarry Smith MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3765*27430b45SBarry Smith MatStoreValues(mat); 3766*27430b45SBarry Smith Call SNESSetJacobian() with matrix 3767*27430b45SBarry Smith In your Jacobian routine 3768*27430b45SBarry Smith MatRetrieveValues(mat); 3769*27430b45SBarry Smith Set nonlinear terms in matrix 3770be6bf707SBarry Smith 3771*27430b45SBarry Smith Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself: 3772*27430b45SBarry Smith // build linear portion of Jacobian 3773*27430b45SBarry Smith MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3774*27430b45SBarry Smith MatStoreValues(mat); 3775*27430b45SBarry Smith loop over nonlinear iterations 3776*27430b45SBarry Smith MatRetrieveValues(mat); 3777*27430b45SBarry Smith // call MatSetValues(mat,...) to set nonlinear portion of Jacobian 3778*27430b45SBarry Smith // call MatAssemblyBegin/End() on matrix 3779*27430b45SBarry Smith Solve linear system with Jacobian 3780*27430b45SBarry Smith endloop 3781*27430b45SBarry Smith .ve 3782be6bf707SBarry Smith 3783be6bf707SBarry Smith Notes: 3784da81f932SPierre Jolivet Matrix must already be assembled before calling this routine 378511a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3786be6bf707SBarry Smith calling this routine. 3787be6bf707SBarry Smith 37880c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37890c468ba9SBarry Smith and does not allocate additional space. 
37900c468ba9SBarry Smith 3791*27430b45SBarry Smith .seealso: `Mat`, `MatRetrieveValues()` 3792be6bf707SBarry Smith @*/ 3793d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3794d71ae5a4SJacob Faibussowitsch { 3795be6bf707SBarry Smith PetscFunctionBegin; 37960700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 379728b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 379828b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3799cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 38003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3801be6bf707SBarry Smith } 3802be6bf707SBarry Smith 3803d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3804d71ae5a4SJacob Faibussowitsch { 3805be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3806d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3807be6bf707SBarry Smith 3808be6bf707SBarry Smith PetscFunctionBegin; 380928b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 381028b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3811be6bf707SBarry Smith /* copy values over */ 38129566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 38133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3814be6bf707SBarry Smith } 3815be6bf707SBarry Smith 3816be6bf707SBarry Smith /*@ 3817be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3818be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3819be6bf707SBarry Smith nonlinear portion. 

  Logically Collective

  Input Parameter:
. mat - the matrix (currently only `MATAIJ` matrices support this option)

  Level: advanced

.seealso: `MatStoreValues()`
@*/
PetscErrorCode MatRetrieveValues(Mat mat)
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
  /* only assembled, unfactored matrices are accepted */
  PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
  PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
  /* hand off to the implementation registered on the object under "MatRetrieveValues_C" */
  PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/* --------------------------------------------------------------------------------*/
/*@C
   MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
   (the default parallel PETSc format).  For good matrix assembly performance
   the user should preallocate the matrix storage by setting the parameter nz
   (or the array nnz).  By setting these parameters accurately, performance
   during matrix assembly can be increased by more than a factor of 50.
384717ab2063SBarry Smith 3848d083f849SBarry Smith Collective 3849db81eaa0SLois Curfman McInnes 385017ab2063SBarry Smith Input Parameters: 385111a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 385217ab2063SBarry Smith . m - number of rows 385317ab2063SBarry Smith . n - number of columns 385417ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 385551c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38560298fd71SBarry Smith (possibly different for each row) or NULL 385717ab2063SBarry Smith 385817ab2063SBarry Smith Output Parameter: 3859416022c9SBarry Smith . A - the matrix 386017ab2063SBarry Smith 386111a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 3862f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 386311a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 3864175b88e8SBarry Smith 3865b259b22eSLois Curfman McInnes Notes: 386649a6f317SBarry Smith If nnz is given then nz is ignored 386749a6f317SBarry Smith 386811a5261eSBarry Smith The AIJ format, also called 386911a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 38700002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 387144cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 387217ab2063SBarry Smith 387317ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 387411a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 38753d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 38766da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 

   By default, this format uses inodes (identical nodes) when possible, to
   improve numerical efficiency of matrix-vector products and solves. We
   search for consecutive rows with the same nonzero structure, thereby
   reusing matrix information to achieve increased efficiency.

   Options Database Keys:
+  -mat_no_inode  - Do not use inodes
-  -mat_inode_limit <limit> - Sets inode limit (max limit=5)

   Level: intermediate

.seealso: [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
@*/
PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
{
  PetscFunctionBegin;
  PetscCall(MatCreate(comm, A));
  /* the same m and n are passed for both pairs of size arguments */
  PetscCall(MatSetSizes(*A, m, n, m, n));
  PetscCall(MatSetType(*A, MATSEQAIJ));
  /* the type has just been set to MATSEQAIJ, so the SeqAIJ preallocation routine is called directly */
  PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*@C
   MatSeqAIJSetPreallocation - For good matrix assembly performance
   the user should preallocate the matrix storage by setting the parameter nz
   (or the array nnz).
By setting these parameters accurately, performance 3905273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3906273d9f13SBarry Smith 3907d083f849SBarry Smith Collective 3908273d9f13SBarry Smith 3909273d9f13SBarry Smith Input Parameters: 39101c4f3114SJed Brown + B - The matrix 3911273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3912273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 39130298fd71SBarry Smith (possibly different for each row) or NULL 3914273d9f13SBarry Smith 3915273d9f13SBarry Smith Notes: 391649a6f317SBarry Smith If nnz is given then nz is ignored 391749a6f317SBarry Smith 391811a5261eSBarry Smith The `MATSEQAIJ` format also called 391911a5261eSBarry Smith compressed row storage, is fully compatible with standard Fortran 77 3920273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3921273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3922273d9f13SBarry Smith 3923273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 392411a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 3925273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3926273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3927273d9f13SBarry Smith 392811a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3929aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3930aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3931aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3932aa95bbe8SBarry Smith 393311a5261eSBarry Smith Developer Notes: 393411a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3935a96a251dSBarry Smith entries or columns indices 3936a96a251dSBarry Smith 3937273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3938273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3939273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3940273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3941273d9f13SBarry Smith 3942273d9f13SBarry Smith Options Database Keys: 3943698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 394447b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3945273d9f13SBarry Smith 3946273d9f13SBarry Smith Level: intermediate 3947273d9f13SBarry Smith 3948db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3949db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3950273d9f13SBarry Smith @*/ 3951d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3952d71ae5a4SJacob Faibussowitsch { 3953a23d5eceSKris Buschelman PetscFunctionBegin; 39546ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39556ba663aaSJed Brown PetscValidType(B, 1); 3956cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 39573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3958a23d5eceSKris Buschelman } 3959a23d5eceSKris Buschelman 3960d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3961d71ae5a4SJacob Faibussowitsch { 3962ad79cf63SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 39632576faa2SJed 
Brown PetscBool skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE; 396497f1f81fSBarry Smith PetscInt i; 3965273d9f13SBarry Smith 3966273d9f13SBarry Smith PetscFunctionBegin; 3967ad79cf63SBarry Smith if (B->hash_active) { 3968ad79cf63SBarry Smith PetscCall(PetscMemcpy(&B->ops, &b->cops, sizeof(*(B->ops)))); 3969ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3970ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3971ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3972ad79cf63SBarry Smith } 39732576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3974a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3975c461c341SBarry Smith skipallocation = PETSC_TRUE; 3976c461c341SBarry Smith nz = 0; 3977c461c341SBarry Smith } 39789566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39799566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3980899cda47SBarry Smith 3981435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 398208401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3983cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3984d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 398508401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 398608401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3987b73539f3SBarry Smith } 3988b73539f3SBarry Smith } 3989b73539f3SBarry Smith 3990273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3991ab93d7beSBarry Smith if (!skipallocation) { 39924dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3993071fcb05SBarry 
Smith if (!b->ilen) { 3994071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. */ 39959566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3996071fcb05SBarry Smith } else { 39979566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39982ee49352SLisandro Dalcin } 39994dfa11a4SJacob Faibussowitsch if (!b->ipre) { PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); } 4000273d9f13SBarry Smith if (!nnz) { 4001435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 4002c62bd62aSJed Brown else if (nz < 0) nz = 1; 40035d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 4004d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 4005d0f46423SBarry Smith nz = nz * B->rmap->n; 4006273d9f13SBarry Smith } else { 4007c73702f5SBarry Smith PetscInt64 nz64 = 0; 40089371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 40099371c9d4SSatish Balay b->imax[i] = nnz[i]; 40109371c9d4SSatish Balay nz64 += nnz[i]; 40119371c9d4SSatish Balay } 40129566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 4013273d9f13SBarry Smith } 4014ab93d7beSBarry Smith 4015273d9f13SBarry Smith /* allocate the matrix space */ 401653dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 40179566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 4018396832f4SHong Zhang if (B->structure_only) { 40199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 40209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 4021396832f4SHong Zhang } else { 40229566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 4023396832f4SHong Zhang } 4024bfeeae90SHong Zhang b->i[0] = 0; 4025ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4026396832f4SHong Zhang if (B->structure_only) { 4027396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4028396832f4SHong Zhang b->free_a = PETSC_FALSE; 4029396832f4SHong Zhang } else { 4030273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4031e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4032396832f4SHong Zhang } 4033e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4034c461c341SBarry Smith } else { 4035e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4036e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4037c461c341SBarry Smith } 4038273d9f13SBarry Smith 4039846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4040846b4da1SFande Kong /* reserve user-requested sparsity */ 40419566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4042846b4da1SFande Kong } 4043846b4da1SFande Kong 4044273d9f13SBarry Smith b->nz = 0; 4045273d9f13SBarry Smith b->maxnz = nz; 4046273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40471baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4048cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4049cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40505519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40515519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40525519a089SJose E. Roman */ 40535519a089SJose E. Roman B->nonzerostate++; 40543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4055273d9f13SBarry Smith } 4056273d9f13SBarry Smith 4057d71ae5a4SJacob Faibussowitsch PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4058d71ae5a4SJacob Faibussowitsch { 4059846b4da1SFande Kong Mat_SeqAIJ *a; 4060a5bbaf83SFande Kong PetscInt i; 4061846b4da1SFande Kong 4062846b4da1SFande Kong PetscFunctionBegin; 4063846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 406414d0e64fSAlex Lindsay 406514d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 40663ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 406714d0e64fSAlex Lindsay 4068846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40692c814fdeSFande Kong /* if no saved info, we error out */ 407028b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40712c814fdeSFande Kong 4072aed4548fSBarry Smith PetscCheck(a->i && a->j && a->a && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40732c814fdeSFande Kong 40749566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40759566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4076846b4da1SFande Kong a->i[0] = 0; 4077ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4078846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4079846b4da1SFande Kong a->nz = 0; 4080846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4081846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4082846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4083846b4da1SFande Kong A->assembled = PETSC_FALSE; 40843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4085846b4da1SFande Kong } 4086846b4da1SFande Kong 408758d36128SBarry Smith /*@ 
408811a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4089a1661176SMatthew Knepley 4090a1661176SMatthew Knepley Input Parameters: 4091a1661176SMatthew Knepley + B - the matrix 4092a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4093a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4094a1661176SMatthew Knepley - v - optional values in the matrix 4095a1661176SMatthew Knepley 4096a1661176SMatthew Knepley Level: developer 4097a1661176SMatthew Knepley 40986a9b8d82SBarry Smith Notes: 409911a5261eSBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 410058d36128SBarry Smith 41016a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 41026a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 41036a9b8d82SBarry Smith 41046a9b8d82SBarry Smith Developer Notes: 41056a9b8d82SBarry Smith An optimization could be added to the implementation where it checks if the i, and j are identical to the current i and j and 410611a5261eSBarry Smith then just copies the v values directly with `PetscMemcpy()`. 41076a9b8d82SBarry Smith 410811a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
41096a9b8d82SBarry Smith 4110db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()` 4111a1661176SMatthew Knepley @*/ 4112d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4113d71ae5a4SJacob Faibussowitsch { 4114a1661176SMatthew Knepley PetscFunctionBegin; 41150700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41166ba663aaSJed Brown PetscValidType(B, 1); 4117cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 41183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4119a1661176SMatthew Knepley } 4120a1661176SMatthew Knepley 4121d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4122d71ae5a4SJacob Faibussowitsch { 4123a1661176SMatthew Knepley PetscInt i; 4124a1661176SMatthew Knepley PetscInt m, n; 4125a1661176SMatthew Knepley PetscInt nz; 41266a9b8d82SBarry Smith PetscInt *nnz; 4127a1661176SMatthew Knepley 4128a1661176SMatthew Knepley PetscFunctionBegin; 4129aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4130779a8d59SSatish Balay 41319566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41329566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4133779a8d59SSatish Balay 41349566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41359566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4136a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4137b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 413808401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" 
PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4139a1661176SMatthew Knepley nnz[i] = nz; 4140a1661176SMatthew Knepley } 41419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41429566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4143a1661176SMatthew Knepley 414448a46eb9SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4145a1661176SMatthew Knepley 41469566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41479566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4148a1661176SMatthew Knepley 41499566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 41503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4151a1661176SMatthew Knepley } 4152a1661176SMatthew Knepley 4153ad7e164aSPierre Jolivet /*@ 4154ad7e164aSPierre Jolivet MatSeqAIJKron - Computes C, the Kronecker product of A and B. 4155ad7e164aSPierre Jolivet 4156ad7e164aSPierre Jolivet Input Parameters: 4157ad7e164aSPierre Jolivet + A - left-hand side matrix 4158ad7e164aSPierre Jolivet . B - right-hand side matrix 415911a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4160ad7e164aSPierre Jolivet 4161ad7e164aSPierre Jolivet Output Parameter: 4162ad7e164aSPierre Jolivet . C - Kronecker product of A and B 4163ad7e164aSPierre Jolivet 4164ad7e164aSPierre Jolivet Level: intermediate 4165ad7e164aSPierre Jolivet 416611a5261eSBarry Smith Note: 416711a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4168ad7e164aSPierre Jolivet 4169db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4170ad7e164aSPierre Jolivet @*/ 4171d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4172d71ae5a4SJacob Faibussowitsch { 4173ad7e164aSPierre Jolivet PetscFunctionBegin; 4174ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4175ad7e164aSPierre Jolivet PetscValidType(A, 1); 4176ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4177ad7e164aSPierre Jolivet PetscValidType(B, 2); 4178ad7e164aSPierre Jolivet PetscValidPointer(C, 4); 4179ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4180ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4181ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4182ad7e164aSPierre Jolivet } 4183cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 41843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4185ad7e164aSPierre Jolivet } 4186ad7e164aSPierre Jolivet 4187d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4188d71ae5a4SJacob Faibussowitsch { 4189ad7e164aSPierre Jolivet Mat newmat; 4190ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4191ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4192ad7e164aSPierre Jolivet PetscScalar *v; 4193fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4194ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4195ad7e164aSPierre Jolivet PetscBool flg; 4196ad7e164aSPierre Jolivet 4197ad7e164aSPierre Jolivet PetscFunctionBegin; 419828b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 419928b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not 
for unassembled matrix"); 420028b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 420128b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 42029566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 420328b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4204aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4205ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42069566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 42079566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 42089566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 42099566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4210ad7e164aSPierre Jolivet i[0] = 0; 4211ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4212ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4213ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4214ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4215ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4216ad7e164aSPierre Jolivet } 4217ad7e164aSPierre Jolivet } 4218ad7e164aSPierre Jolivet } 42199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4220ad7e164aSPierre Jolivet *C = newmat; 42219566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4222ad7e164aSPierre Jolivet nnz = 0; 4223ad7e164aSPierre Jolivet } 42249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 42259566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4227ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4228ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4229ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4230ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4231ad7e164aSPierre Jolivet } 4232ad7e164aSPierre Jolivet } 4233ad7e164aSPierre Jolivet } 42349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 42373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4238ad7e164aSPierre Jolivet } 4239ad7e164aSPierre Jolivet 4240c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4241af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4242170fe5c8SBarry Smith 4243170fe5c8SBarry Smith /* 4244170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4245170fe5c8SBarry Smith 4246170fe5c8SBarry Smith n p p 42472da392ccSBarry Smith [ ] [ ] [ ] 42482da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42492da392ccSBarry Smith [ ] [ ] [ ] 4250170fe5c8SBarry Smith 4251170fe5c8SBarry Smith */ 4252d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4253d71ae5a4SJacob Faibussowitsch { 4254170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4255170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4256170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 425786214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4258170fe5c8SBarry Smith const PetscInt *ii, *idx; 4259170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4260170fe5c8SBarry Smith PetscScalar *c, *c_q; 426186214ceeSStefano Zampini PetscInt clda = sub_c->lda; 426286214ceeSStefano 
Zampini PetscInt alda = sub_a->lda; 4263170fe5c8SBarry Smith 4264170fe5c8SBarry Smith PetscFunctionBegin; 4265d0f46423SBarry Smith m = A->rmap->n; 4266d0f46423SBarry Smith n = A->cmap->n; 4267d0f46423SBarry Smith p = B->cmap->n; 4268170fe5c8SBarry Smith a = sub_a->v; 4269170fe5c8SBarry Smith b = sub_b->a; 4270170fe5c8SBarry Smith c = sub_c->v; 427186214ceeSStefano Zampini if (clda == m) { 42729566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 427386214ceeSStefano Zampini } else { 427486214ceeSStefano Zampini for (j = 0; j < p; j++) 42759371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 427686214ceeSStefano Zampini } 4277170fe5c8SBarry Smith ii = sub_b->i; 4278170fe5c8SBarry Smith idx = sub_b->j; 4279170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4280170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4281170fe5c8SBarry Smith while (q-- > 0) { 428286214ceeSStefano Zampini c_q = c + clda * (*idx); 428386214ceeSStefano Zampini a_q = a + alda * i; 4284854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4285170fe5c8SBarry Smith idx++; 4286170fe5c8SBarry Smith b++; 4287170fe5c8SBarry Smith } 4288170fe5c8SBarry Smith } 42893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4290170fe5c8SBarry Smith } 4291170fe5c8SBarry Smith 4292d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4293d71ae5a4SJacob Faibussowitsch { 4294d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 429586214ceeSStefano Zampini PetscBool cisdense; 4296170fe5c8SBarry Smith 4297170fe5c8SBarry Smith PetscFunctionBegin; 429808401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42999566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 43009566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 4301d5e393b6SSuyash Tandon 
PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 430248a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 43039566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4304d73949e8SHong Zhang 43054222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 43063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4307170fe5c8SBarry Smith } 4308170fe5c8SBarry Smith 4309170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 43100bad9183SKris Buschelman /*MC 4311fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43120bad9183SKris Buschelman based on compressed sparse row format. 43130bad9183SKris Buschelman 43140bad9183SKris Buschelman Options Database Keys: 43150bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43160bad9183SKris Buschelman 43170bad9183SKris Buschelman Level: beginner 43180bad9183SKris Buschelman 43190cd7f59aSBarry Smith Notes: 432011a5261eSBarry Smith `MatSetValues()` may be called for this matrix type with a NULL argument for the numerical values, 43210cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43220cd7f59aSBarry Smith in the matrix 43230cd7f59aSBarry Smith 432411a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored

   Developer Note:
    It would be nice if all matrix formats supported passing NULL in for the numerical values

.seealso: `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
   and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
   `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Key:
. -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`

   Note:
    Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, and `MATAIJCRL`; this type also automatically switches over to use inodes when
    enough exist.
4348ccd284c7SBarry Smith 4349ccd284c7SBarry Smith Level: beginner 4350ccd284c7SBarry Smith 4351db781477SPatrick Sanan .seealso: `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4352ccd284c7SBarry Smith M*/ 4353ccd284c7SBarry Smith 4354ccd284c7SBarry Smith /*MC 4355ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4356ccd284c7SBarry Smith 435711a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 435811a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 435911a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4360ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4361ccd284c7SBarry Smith the above preallocation routines for simplicity. 4362ccd284c7SBarry Smith 4363ccd284c7SBarry Smith Options Database Keys: 436411a5261eSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 4365ccd284c7SBarry Smith 4366ccd284c7SBarry Smith Level: beginner 4367ccd284c7SBarry Smith 4368c2e3fba1SPatrick Sanan .seealso: `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4369ccd284c7SBarry Smith M*/ 4370ccd284c7SBarry Smith 43717906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43727906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43737906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43747906f579SHong Zhang #endif 4375d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4376d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4377d24d4204SJose E. 
Roman #endif 43787906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43797906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43807906f579SHong Zhang #endif 43817906f579SHong Zhang 4382d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4383c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43844222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43857906f579SHong Zhang 43868c778c55SBarry Smith /*@C 438711a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43888c778c55SBarry Smith 43898c778c55SBarry Smith Not Collective 43908c778c55SBarry Smith 43918c778c55SBarry Smith Input Parameter: 439211a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 43938c778c55SBarry Smith 43948c778c55SBarry Smith Output Parameter: 43958c778c55SBarry Smith . 
array - pointer to the data 43968c778c55SBarry Smith 43978c778c55SBarry Smith Level: intermediate 43988c778c55SBarry Smith 43990ab4885dSBarry Smith Fortran Note: 44000ab4885dSBarry Smith `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()` 44010ab4885dSBarry Smith 4402db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 44038c778c55SBarry Smith @*/ 4404d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4405d71ae5a4SJacob Faibussowitsch { 4406d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44078c778c55SBarry Smith 44088c778c55SBarry Smith PetscFunctionBegin; 4409d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44109566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4411d67d9f35SJunchao Zhang } else { 4412d67d9f35SJunchao Zhang *array = aij->a; 4413d67d9f35SJunchao Zhang } 44143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4415d67d9f35SJunchao Zhang } 4416d67d9f35SJunchao Zhang 4417d67d9f35SJunchao Zhang /*@C 441811a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4419d67d9f35SJunchao Zhang 4420d67d9f35SJunchao Zhang Not Collective 4421d67d9f35SJunchao Zhang 4422d67d9f35SJunchao Zhang Input Parameters: 442311a5261eSBarry Smith + mat - a `MATSEQAIJ` matrix 4424d67d9f35SJunchao Zhang - array - pointer to the data 4425d67d9f35SJunchao Zhang 4426d67d9f35SJunchao Zhang Level: intermediate 4427d67d9f35SJunchao Zhang 44280ab4885dSBarry Smith Fortran Note: 44290ab4885dSBarry Smith `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()` 44300ab4885dSBarry Smith 4431db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4432d67d9f35SJunchao Zhang @*/ 4433d71ae5a4SJacob Faibussowitsch PetscErrorCode 
MatSeqAIJRestoreArray(Mat A, PetscScalar **array) 4434d71ae5a4SJacob Faibussowitsch { 4435d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4436d67d9f35SJunchao Zhang 4437d67d9f35SJunchao Zhang PetscFunctionBegin; 4438d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44399566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4440d67d9f35SJunchao Zhang } else { 4441d67d9f35SJunchao Zhang *array = NULL; 4442d67d9f35SJunchao Zhang } 44439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44449566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44468c778c55SBarry Smith } 44478c778c55SBarry Smith 444821e72a00SBarry Smith /*@C 444911a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44508f1ea47aSStefano Zampini 44510ab4885dSBarry Smith Not Collective; No Fortran Support 44528f1ea47aSStefano Zampini 44538f1ea47aSStefano Zampini Input Parameter: 445411a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44558f1ea47aSStefano Zampini 44568f1ea47aSStefano Zampini Output Parameter: 44578f1ea47aSStefano Zampini . 
array - pointer to the data 44588f1ea47aSStefano Zampini 44598f1ea47aSStefano Zampini Level: intermediate 44608f1ea47aSStefano Zampini 4461db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44628f1ea47aSStefano Zampini @*/ 4463d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4464d71ae5a4SJacob Faibussowitsch { 4465d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44668f1ea47aSStefano Zampini 44678f1ea47aSStefano Zampini PetscFunctionBegin; 4468d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44699566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4470d67d9f35SJunchao Zhang } else { 4471d67d9f35SJunchao Zhang *array = aij->a; 4472d67d9f35SJunchao Zhang } 44733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44748f1ea47aSStefano Zampini } 44758f1ea47aSStefano Zampini 44768f1ea47aSStefano Zampini /*@C 447711a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44788f1ea47aSStefano Zampini 44790ab4885dSBarry Smith Not Collective; No Fortran Support 44808f1ea47aSStefano Zampini 44818f1ea47aSStefano Zampini Input Parameter: 448211a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44838f1ea47aSStefano Zampini 44848f1ea47aSStefano Zampini Output Parameter: 44858f1ea47aSStefano Zampini . 
array - pointer to the data 44868f1ea47aSStefano Zampini 44878f1ea47aSStefano Zampini Level: intermediate 44888f1ea47aSStefano Zampini 4489db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44908f1ea47aSStefano Zampini @*/ 4491d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4492d71ae5a4SJacob Faibussowitsch { 4493d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44948f1ea47aSStefano Zampini 44958f1ea47aSStefano Zampini PetscFunctionBegin; 4496d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44979566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4498d67d9f35SJunchao Zhang } else { 4499d67d9f35SJunchao Zhang *array = NULL; 4500d67d9f35SJunchao Zhang } 45013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4502d67d9f35SJunchao Zhang } 4503d67d9f35SJunchao Zhang 4504d67d9f35SJunchao Zhang /*@C 450511a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4506d67d9f35SJunchao Zhang 45070ab4885dSBarry Smith Not Collective; No Fortran Support 4508d67d9f35SJunchao Zhang 4509d67d9f35SJunchao Zhang Input Parameter: 451011a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 4511d67d9f35SJunchao Zhang 4512d67d9f35SJunchao Zhang Output Parameter: 4513d67d9f35SJunchao Zhang . 
array - pointer to the data 4514d67d9f35SJunchao Zhang 4515d67d9f35SJunchao Zhang Level: intermediate 4516d67d9f35SJunchao Zhang 4517db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4518d67d9f35SJunchao Zhang @*/ 4519d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4520d71ae5a4SJacob Faibussowitsch { 4521d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4522d67d9f35SJunchao Zhang 4523d67d9f35SJunchao Zhang PetscFunctionBegin; 4524d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45259566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4526d67d9f35SJunchao Zhang } else { 4527d67d9f35SJunchao Zhang *array = aij->a; 4528d67d9f35SJunchao Zhang } 45299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45309566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 45313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4532d67d9f35SJunchao Zhang } 4533d67d9f35SJunchao Zhang 4534d67d9f35SJunchao Zhang /*@C 4535d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4536d67d9f35SJunchao Zhang 45370ab4885dSBarry Smith Not Collective; No Fortran Support 4538d67d9f35SJunchao Zhang 4539d67d9f35SJunchao Zhang Input Parameter: 4540d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4541d67d9f35SJunchao Zhang 4542d67d9f35SJunchao Zhang Output Parameter: 4543d67d9f35SJunchao Zhang . 
array - pointer to the data 4544d67d9f35SJunchao Zhang 4545d67d9f35SJunchao Zhang Level: intermediate 4546d67d9f35SJunchao Zhang 4547db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4548d67d9f35SJunchao Zhang @*/ 4549d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4550d71ae5a4SJacob Faibussowitsch { 4551d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4552d67d9f35SJunchao Zhang 4553d67d9f35SJunchao Zhang PetscFunctionBegin; 4554d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45559566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4556d67d9f35SJunchao Zhang } else { 4557d67d9f35SJunchao Zhang *array = NULL; 4558d67d9f35SJunchao Zhang } 45593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45608f1ea47aSStefano Zampini } 45618f1ea47aSStefano Zampini 45628f1ea47aSStefano Zampini /*@C 456311a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45647ee59b9bSJunchao Zhang 45650ab4885dSBarry Smith Not Collective; No Fortran Support 45667ee59b9bSJunchao Zhang 45677ee59b9bSJunchao Zhang Input Parameter: 456811a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45697ee59b9bSJunchao Zhang 45707ee59b9bSJunchao Zhang Output Parameters: 45717ee59b9bSJunchao Zhang + i - row map array of the matrix 45727ee59b9bSJunchao Zhang . j - column index array of the matrix 45737ee59b9bSJunchao Zhang . a - data array of the matrix 45747ee59b9bSJunchao Zhang - memtype - memory type of the arrays 45757ee59b9bSJunchao Zhang 45767ee59b9bSJunchao Zhang Notes: 45777ee59b9bSJunchao Zhang Any of the output parameters can be NULL, in which case the corresponding value is not returned. 45787ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 
nz - the maximum number of nonzeros in any row

  Level: intermediate

.seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
@*/
PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;

  PetscFunctionBegin;
  /* Simply reports the value stored in the rmax field; nothing is recomputed here */
  *nz = aij->rmax;
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
  MatSetPreallocationCOO_SeqAIJ - builds the CSR structure of mat from a list of coo_n (row, column) pairs
  and records the mapping needed later by MatSetValuesCOO_SeqAIJ().

  Steps, in order:
    1. Any entry with a negative column index gets its row index set to -1; perm[] starts as the identity.
    2. The entries are sorted by row (carrying j[] and perm[] along); nneg counts the leading entries
       with a negative row index, which are ignored from then on.
    3. Within every row the entries are sorted by column and duplicates are collapsed: Ai[] collects the
       number of unique columns per row, Aj[] the unique column indices, and jmap[] the number of
       repeats of each unique nonzero.
    4. Ai[] and jmap[] are turned into offsets by prefix sums; jmap[] and Aj[] are shrunk to the number
       of unique nonzeros, and the ignored leading entries are removed from perm[].
    5. A zeroed value array is allocated and Ai/Aj/Aa are installed with MatSetSeqAIJWithArrays_private();
       coo_n, Atot, jmap and perm are stored in the Mat_SeqAIJ struct.

  The caller's coo_i[] and coo_j[] arrays are used as work space: i and j alias them, and they are
  written to and passed to the sort routines.

  NOTE(review): comm is obtained with PetscObjectGetComm() but not otherwise used in this function.
  NOTE(review): row indices are used to index Ai[] without a check against M, and column indices are
  not checked against N - presumably validated by the caller; confirm.
*/
PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
{
  MPI_Comm     comm;
  PetscInt    *i, *j;
  PetscInt     M, N, row;
  PetscCount   k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */
  PetscInt    *Ai;                             /* Change to PetscCount once we use it for row pointers */
  PetscInt    *Aj;
  PetscScalar *Aa;
  Mat_SeqAIJ  *seqaij = (Mat_SeqAIJ *)(mat->data);
  MatType      rtype;
  PetscCount  *perm, *jmap;

  PetscFunctionBegin;
  PetscCall(MatResetPreallocationCOO_SeqAIJ(mat));
  PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
  PetscCall(MatGetSize(mat, &M, &N));
  i = coo_i;
  j = coo_j;
  PetscCall(PetscMalloc1(coo_n, &perm));
  for (k = 0; k < coo_n; k++) { /* Ignore entries with negative row or col indices */
    if (j[k] < 0) i[k] = -1;    /* a negative column is folded into a negative row so that one test covers both */
    perm[k] = k;
  }

  /* Sort by row */
  PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm));
  for (k = 0; k < coo_n; k++) {
    if (i[k] >= 0) break;
  } /* Advance k to the first row with a non-negative index */
  nneg = k;
  PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
  nnz = 0;                                          /* Total number of unique nonzeros to be counted */
  jmap++;                                           /* Inc jmap by 1 for convenience */

  PetscCall(PetscCalloc1(M + 1, &Ai));        /* CSR of A */
  PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */

  /* In each row, sort by column, then unique column indices to get row length */
  Ai++;  /* Inc by 1 for convenience */
  q = 0; /* q-th unique nonzero, with q starting from 0 */
  while (k < coo_n) {
    row   = i[k];
    start = k; /* [start,end) indices for this row */
    while (k < coo_n && i[k] == row) k++;
    end = k;
    PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start));
    /* Find number of unique col entries in this row */
    Aj[q]   = j[start]; /* Log the first nonzero in this row */
    jmap[q] = 1;        /* Number of repeats of this nonzero entry */
    Ai[row] = 1;
    nnz++;

    for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */
      if (j[p] != j[p - 1]) {           /* Meet a new nonzero */
        q++;
        jmap[q] = 1;
        Aj[q]   = j[p];
        Ai[row]++;
        nnz++;
      } else {
        jmap[q]++;
      }
    }
    q++; /* Move to next row and thus next unique nonzero */
  }

  Ai--; /* Back to the beginning of Ai[] */
  for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; /* per-row counts -> row offsets */
  jmap--; /* Back to the beginning of jmap[] */
  jmap[0] = 0;
  for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; /* repeat counts -> offsets into perm[] */
  if (nnz < coo_n - nneg) {                         /* Realloc with actual number of unique nonzeros */
    PetscCount *jmap_new;
    PetscInt   *Aj_new;

    PetscCall(PetscMalloc1(nnz + 1, &jmap_new));
    PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1));
    PetscCall(PetscFree(jmap));
    jmap = jmap_new;

    PetscCall(PetscMalloc1(nnz, &Aj_new));
    PetscCall(PetscArraycpy(Aj_new, Aj, nnz));
    PetscCall(PetscFree(Aj));
    Aj = Aj_new;
  }

  if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
    PetscCount *perm_new;

    PetscCall(PetscMalloc1(coo_n - nneg, &perm_new));
    PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg));
    PetscCall(PetscFree(perm));
    perm = perm_new;
  }

  PetscCall(MatGetRootType_Private(mat, &rtype));
  PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */
  PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat));

  seqaij->singlemalloc = PETSC_FALSE;            /* Ai, Aj and Aa are not allocated in one big malloc */
  seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
  /* Record COO fields */
  seqaij->coo_n = coo_n;
  seqaij->Atot  = coo_n - nneg; /* Annz is seqaij->nz, so no need to record that again */
  seqaij->jmap  = jmap;         /* of length nnz+1 */
  seqaij->perm  = perm;
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
  MatSetValuesCOO_SeqAIJ - sets the stored values of A from the COO value array v[], using the jmap[] and
  perm[] arrays stored in the Mat_SeqAIJ struct.

  For the i-th stored nonzero, the entries v[perm[j]] with j in [jmap[i], jmap[i+1]) are summed. With
  INSERT_VALUES the sum replaces the stored value; for any other imode it is added to the stored value.
*/
static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode)
{
  Mat_SeqAIJ  *aseq = (Mat_SeqAIJ *)A->data;
  PetscCount   i, j, Annz = aseq->nz;
  PetscCount  *perm = aseq->perm, *jmap = aseq->jmap;
  PetscScalar *Aa;

  PetscFunctionBegin;
  PetscCall(MatSeqAIJGetArray(A, &Aa));
  for (i = 0; i < Annz; i++) {
    PetscScalar sum = 0.0;
    for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]];
    Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum;
  }
  PetscCall(MatSeqAIJRestoreArray(A, &Aa));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/* Conversion routines defined elsewhere; each is declared only when the matching backend is configured */
#if defined(PETSC_HAVE_CUDA)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_HIP)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *);
#endif

PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
{
  Mat_SeqAIJ *b;
  PetscMPIInt size;

  PetscFunctionBegin;
  /* This type is only valid on a communicator with a single process */
  PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
  PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");

  PetscCall(PetscNew(&b));

  B->data = (void *)b;

  /* Start from the default SeqAIJ operation table */
  PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps)));
  if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;

  /* Default state of a freshly created matrix */
  b->row                = NULL;
  b->col                = NULL;
  b->icol               = NULL;
  b->reallocs           = 0;
  b->ignorezeroentries  = PETSC_FALSE;
  b->roworiented        = PETSC_TRUE;
  b->nonew              = 0;
  b->diag               = NULL;
  b->solve_work         = NULL;
  B->spptr              = NULL;
  b->saved_values       = NULL;
  b->idiag              = NULL;
  b->mdiag              = NULL;
  b->ssor_work          = NULL;
  b->omega              = 1.0;
  b->fshift             = 0.0;
  b->idiagvalid         = PETSC_FALSE;
  b->ibdiagvalid        = PETSC_FALSE;
  b->keepnonzeropattern = PETSC_FALSE;

  PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));

  /* Compose the type-specific functions on B under their string names */
#if defined(PETSC_HAVE_MATLAB)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
#endif
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
#if defined(PETSC_HAVE_MKL_SPARSE)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
#endif
#if defined(PETSC_HAVE_CUDA)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
#endif
#if defined(PETSC_HAVE_HIP)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ));
#endif
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
#endif
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
#if defined(PETSC_HAVE_ELEMENTAL)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
#endif
#if defined(PETSC_HAVE_SCALAPACK)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
#endif
#if defined(PETSC_HAVE_HYPRE)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
#endif
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
  /* NOTE(review): the Hermitian-transpose query is bound to the same routine as the plain transpose query - confirm this is intended for complex scalars */
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
  PetscCall(MatCreate_SeqAIJ_Inode(B));
  /* NOTE(review): the type name is set a second time here, presumably because MatCreate_SeqAIJ_Inode() may change it - confirm */
  PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
  PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
    Given a matrix generated with MatGetFactor() duplicates all the information in A into C
*/
PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace)
{
  Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data;
  PetscInt    m = A->rmap->n, i;

  PetscFunctionBegin;
  /* An unassembled matrix may only be duplicated when its values are not being copied */
  PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix");

  C->factortype = A->factortype;
Dalcin c->row = NULL; 4875f4259b30SLisandro Dalcin c->col = NULL; 4876f4259b30SLisandro Dalcin c->icol = NULL; 48776ad4291fSHong Zhang c->reallocs = 0; 487817ab2063SBarry Smith 487969272f91SPierre Jolivet C->assembled = A->assembled; 488069272f91SPierre Jolivet C->preallocated = A->preallocated; 488117ab2063SBarry Smith 488269272f91SPierre Jolivet if (A->preallocated) { 48839566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 48849566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4885eec197d1SBarry Smith 48869566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 48879566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 48889566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 48899566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 489017ab2063SBarry Smith 489117ab2063SBarry Smith /* allocate the matrix space */ 4892f77e22a1SHong Zhang if (mallocmatspace) { 48939566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 48942205254eSKarl Rupp 4895f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 48962205254eSKarl Rupp 48979566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 489817ab2063SBarry Smith if (m > 0) { 48999566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4900be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 49012e5835c6SStefano Zampini const PetscScalar *aa; 49022e5835c6SStefano Zampini 49039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 49049566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 49059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 4906be6bf707SBarry Smith } else { 49079566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 490817ab2063SBarry Smith } 490908480c60SBarry Smith } 4910f77e22a1SHong 
Zhang } 491117ab2063SBarry Smith 49126ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4913416022c9SBarry Smith c->roworiented = a->roworiented; 4914416022c9SBarry Smith c->nonew = a->nonew; 4915416022c9SBarry Smith if (a->diag) { 49169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 49179566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 4918071fcb05SBarry Smith } else c->diag = NULL; 49192205254eSKarl Rupp 4920f4259b30SLisandro Dalcin c->solve_work = NULL; 4921f4259b30SLisandro Dalcin c->saved_values = NULL; 4922f4259b30SLisandro Dalcin c->idiag = NULL; 4923f4259b30SLisandro Dalcin c->ssor_work = NULL; 4924a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4925e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4926e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 49276ad4291fSHong Zhang 4928893ad86cSHong Zhang c->rmax = a->rmax; 4929416022c9SBarry Smith c->nz = a->nz; 49308ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4931754ec7b1SSatish Balay 49326ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 49336ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4934cd6b891eSBarry Smith if (a->compressedrow.use) { 49356ad4291fSHong Zhang i = a->compressedrow.nrows; 49369566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 49379566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 49389566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 493927ea64f8SHong Zhang } else { 494027ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 49410298fd71SBarry Smith c->compressedrow.i = NULL; 49420298fd71SBarry Smith c->compressedrow.rindex = NULL; 49436ad4291fSHong Zhang } 4944ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4945e56f5c9eSBarry Smith 
C->nonzerostate = A->nonzerostate; 49464846f1f5SKris Buschelman 49479566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 494869272f91SPierre Jolivet } 49499566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 49503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 495117ab2063SBarry Smith } 495217ab2063SBarry Smith 4953d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 4954d71ae5a4SJacob Faibussowitsch { 4955b24902e0SBarry Smith PetscFunctionBegin; 49569566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 49579566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 495848a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 49599566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 49609566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 49613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4962b24902e0SBarry Smith } 4963b24902e0SBarry Smith 4964d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4965d71ae5a4SJacob Faibussowitsch { 496652f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 496752f91c60SVaclav Hapla 496852f91c60SVaclav Hapla PetscFunctionBegin; 496952f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 497052f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 4971c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 49729566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 49739566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 
49749566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 497552f91c60SVaclav Hapla if (isbinary) { 49769566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 497752f91c60SVaclav Hapla } else if (ishdf5) { 497852f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 49799566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 498052f91c60SVaclav Hapla #else 498152f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 498252f91c60SVaclav Hapla #endif 498352f91c60SVaclav Hapla } else { 498498921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 498552f91c60SVaclav Hapla } 49863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 498752f91c60SVaclav Hapla } 498852f91c60SVaclav Hapla 4989d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 4990d71ae5a4SJacob Faibussowitsch { 49913ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 49923ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 4993fbdbba38SShri Abhyankar 4994fbdbba38SShri Abhyankar PetscFunctionBegin; 49959566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 4996bbead8a2SBarry Smith 49973ea6fe3dSLisandro Dalcin /* read in matrix header */ 49989566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 499908401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 50009371c9d4SSatish Balay M = header[1]; 50019371c9d4SSatish Balay N = header[2]; 50029371c9d4SSatish Balay nz = header[3]; 500308401ef6SPierre Jolivet 
PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 500408401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 500508401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 5006fbdbba38SShri Abhyankar 50073ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 50089566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 50093ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 50103ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 50113ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 50123ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 50133ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 50149566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 50159566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 50163ea6fe3dSLisandro Dalcin 50173ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 50189566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5019aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50203ea6fe3dSLisandro Dalcin 5021fbdbba38SShri Abhyankar /* read in row lengths */ 50229566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 50239566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 50243ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 50259371c9d4SSatish Balay sum = 0; 
50269371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 502708401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 50283ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 50299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 50309566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5031aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50323ea6fe3dSLisandro Dalcin /* store row lengths */ 50339566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 50349566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5035fbdbba38SShri Abhyankar 50363ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50379371c9d4SSatish Balay a->i[0] = 0; 50389371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 50393ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50409566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 50413ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50429566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5043fbdbba38SShri Abhyankar 50449566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 50459566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 50463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5047fbdbba38SShri Abhyankar } 5048fbdbba38SShri Abhyankar 5049d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5050d71ae5a4SJacob Faibussowitsch { 50517264ac53SSatish 
Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5052fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5053eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5054eeffb40dSHong Zhang PetscInt k; 5055eeffb40dSHong Zhang #endif 50567264ac53SSatish Balay 50573a40ed3dSBarry Smith PetscFunctionBegin; 5058bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5059d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5060ca44d042SBarry Smith *flg = PETSC_FALSE; 50613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5062bcd2baecSBarry Smith } 50637264ac53SSatish Balay 50647264ac53SSatish Balay /* if the a->i are the same */ 50659566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 50663ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 50677264ac53SSatish Balay 50687264ac53SSatish Balay /* if a->j are the same */ 50699566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 50703ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 5071bcd2baecSBarry Smith 50729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5074bcd2baecSBarry Smith /* if a->a are the same */ 5075eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5076eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5077fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5078eeffb40dSHong Zhang *flg = PETSC_FALSE; 50793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5080eeffb40dSHong Zhang } 5081eeffb40dSHong Zhang } 5082eeffb40dSHong Zhang #else 50839566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5084eeffb40dSHong Zhang #endif 50859566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 50869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 50873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 50887264ac53SSatish Balay } 508936db0b34SBarry Smith 509005869f15SSatish Balay /*@ 509111a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 509236db0b34SBarry Smith provided by the user. 509336db0b34SBarry Smith 5094d083f849SBarry Smith Collective 509536db0b34SBarry Smith 509636db0b34SBarry Smith Input Parameters: 509736db0b34SBarry Smith + comm - must be an MPI communicator of size 1 509836db0b34SBarry Smith . m - number of rows 509936db0b34SBarry Smith . n - number of columns 5100483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 510136db0b34SBarry Smith . j - column indices 510236db0b34SBarry Smith - a - matrix values 510336db0b34SBarry Smith 510436db0b34SBarry Smith Output Parameter: 510536db0b34SBarry Smith . mat - the matrix 510636db0b34SBarry Smith 510736db0b34SBarry Smith Level: intermediate 510836db0b34SBarry Smith 510936db0b34SBarry Smith Notes: 51100551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 5111292fb18eSBarry Smith once the matrix is destroyed and not before 511236db0b34SBarry Smith 511336db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 511436db0b34SBarry Smith 5115bfeeae90SHong Zhang The i and j indices are 0 based 511636db0b34SBarry Smith 5117a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5118a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 51198eef79e4SBarry Smith as shown 5120a4552177SSatish Balay 51218eef79e4SBarry Smith $ 1 0 0 51228eef79e4SBarry Smith $ 2 0 3 51238eef79e4SBarry Smith $ 4 5 6 51248eef79e4SBarry Smith $ 51258eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 51268eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 51278eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 5128a4552177SSatish Balay 5129db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 513036db0b34SBarry Smith @*/ 5131d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5132d71ae5a4SJacob Faibussowitsch { 5133cbcfb4deSHong Zhang PetscInt ii; 513436db0b34SBarry Smith Mat_SeqAIJ *aij; 5135cbcfb4deSHong Zhang PetscInt jj; 513636db0b34SBarry Smith 513736db0b34SBarry Smith PetscFunctionBegin; 5138aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 51399566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51409566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51419566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51429566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5144ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 51459566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 51469566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5147ab93d7beSBarry Smith 514836db0b34SBarry Smith aij->i = i; 514936db0b34SBarry Smith aij->j = j; 515036db0b34SBarry Smith aij->a = a; 515136db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 
515236db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5153e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5154e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 515536db0b34SBarry Smith 5156cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 515736db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 515876bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5159aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 51609985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 516108401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 516208401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 51639985e31cSBarry Smith } 516436db0b34SBarry Smith } 516576bd3646SJed Brown } 516676bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 516736db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 516808401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5169aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 517036db0b34SBarry Smith } 517176bd3646SJed Brown } 517236db0b34SBarry Smith 51739566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, 
MAT_FINAL_ASSEMBLY)); 51749566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 51753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 517636db0b34SBarry Smith } 5177cbc6b225SStefano Zampini 5178f62e3866SBarry Smith /*@ 517911a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 51808a0b0e6bSVictor Minden provided by the user. 51818a0b0e6bSVictor Minden 5182d083f849SBarry Smith Collective 51838a0b0e6bSVictor Minden 51848a0b0e6bSVictor Minden Input Parameters: 51858a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 51868a0b0e6bSVictor Minden . m - number of rows 51878a0b0e6bSVictor Minden . n - number of columns 51888a0b0e6bSVictor Minden . i - row indices 51898a0b0e6bSVictor Minden . j - column indices 51901230e6d1SVictor Minden . a - matrix values 51911230e6d1SVictor Minden . nz - number of nonzeros 519211a5261eSBarry Smith - idx - if the i and j indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 51938a0b0e6bSVictor Minden 51948a0b0e6bSVictor Minden Output Parameter: 51958a0b0e6bSVictor Minden . 
mat - the matrix 51968a0b0e6bSVictor Minden 51978a0b0e6bSVictor Minden Level: intermediate 51988a0b0e6bSVictor Minden 5199f62e3866SBarry Smith Example: 5200f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 52019e99939fSJunchao Zhang .vb 52028a0b0e6bSVictor Minden 1 0 0 52038a0b0e6bSVictor Minden 2 0 3 52048a0b0e6bSVictor Minden 4 5 6 52058a0b0e6bSVictor Minden 52068a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 52078a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 52088a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 52099e99939fSJunchao Zhang .ve 5210d7547e51SJunchao Zhang Notes: 5211d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5212d7547e51SJunchao Zhang and are particularly useful in iterative applications. 52138a0b0e6bSVictor Minden 5214d7547e51SJunchao Zhang .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 52158a0b0e6bSVictor Minden @*/ 5216d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5217d71ae5a4SJacob Faibussowitsch { 5218d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 52198a0b0e6bSVictor Minden 52208a0b0e6bSVictor Minden PetscFunctionBegin; 52219566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5222ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 52239566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52249566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52259566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 52271230e6d1SVictor 
Minden for (ii = 0; ii < nz; ii++) { 52281230e6d1SVictor Minden if (idx) { 52291230e6d1SVictor Minden row = i[ii] - 1; 52301230e6d1SVictor Minden col = j[ii] - 1; 52311230e6d1SVictor Minden } else { 52321230e6d1SVictor Minden row = i[ii]; 52331230e6d1SVictor Minden col = j[ii]; 52348a0b0e6bSVictor Minden } 52359566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 52368a0b0e6bSVictor Minden } 52379566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52389566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52399566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52418a0b0e6bSVictor Minden } 524236db0b34SBarry Smith 5243d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5244d71ae5a4SJacob Faibussowitsch { 5245acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5246acf2f550SJed Brown 5247acf2f550SJed Brown PetscFunctionBegin; 5248acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5249acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 52502205254eSKarl Rupp 52519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 52523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5253acf2f550SJed Brown } 5254acf2f550SJed Brown 5255d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5256d71ae5a4SJacob Faibussowitsch { 52579c8f2541SHong Zhang PetscFunctionBegin; 52589566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 52593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52609c8f2541SHong Zhang } 52619c8f2541SHong Zhang 526281824310SBarry Smith /* 526353dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 
526453dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 526553dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 526653dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 526753dd7562SDmitry Karpeev */ 5268d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5269d71ae5a4SJacob Faibussowitsch { 527053dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 527153dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 527253dd7562SDmitry Karpeev PetscBool seqaij; 527353dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 527453dd7562SDmitry Karpeev PetscScalar v; 527553dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 527653dd7562SDmitry Karpeev 527753dd7562SDmitry Karpeev PetscFunctionBegin; 52783ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 527953dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 52809566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 528128b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 528253dd7562SDmitry Karpeev if (rowemb) { 52839566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 528408401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 528553dd7562SDmitry Karpeev } else { 528608401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 528753dd7562SDmitry Karpeev } 528853dd7562SDmitry Karpeev if (colemb) { 52899566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 529008401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 529153dd7562SDmitry Karpeev } else { 529208401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 529353dd7562SDmitry Karpeev } 529453dd7562SDmitry Karpeev 529553dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ *)(B->data); 529653dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 52979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5298ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 52999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 53009566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 530153dd7562SDmitry Karpeev } 530248a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 530353dd7562SDmitry Karpeev count = 0; 530453dd7562SDmitry Karpeev rowindices = NULL; 
530553dd7562SDmitry Karpeev colindices = NULL; 530648a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 530748a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 530853dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 530953dd7562SDmitry Karpeev PetscInt row; 531053dd7562SDmitry Karpeev row = i; 531153dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 531253dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 531353dd7562SDmitry Karpeev PetscInt col; 531453dd7562SDmitry Karpeev col = Baij->j[count]; 531553dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 531653dd7562SDmitry Karpeev v = Baij->a[count]; 53179566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 531853dd7562SDmitry Karpeev ++count; 531953dd7562SDmitry Karpeev } 532053dd7562SDmitry Karpeev } 532153dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 532253dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 532353dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 532453dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 532553dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 53263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 532753dd7562SDmitry Karpeev } 532853dd7562SDmitry Karpeev 5329dec0b466SHong Zhang PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A) 5330dec0b466SHong Zhang { 5331dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5332dec0b466SHong Zhang MatScalar *aa = a->a; 5333dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5334dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5335dec0b466SHong Zhang 5336dec0b466SHong Zhang PetscFunctionBegin; 5337dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5338dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5339dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5340dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5341dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 5342dec0b466SHong Zhang if (aa[k] == 0 && aj[k] != i - 1) fshift++; 5343dec0b466SHong Zhang else { 5344dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5345dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5346dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5347dec0b466SHong Zhang } 5348dec0b466SHong Zhang } 5349dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5350dec0b466SHong Zhang fshift_prev = fshift; 5351dec0b466SHong Zhang /* reset ilen and imax for each row */ 5352dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5353dec0b466SHong Zhang a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0); 
5354dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5355dec0b466SHong Zhang } 5356dec0b466SHong Zhang if (m) { 5357dec0b466SHong Zhang ai[m] -= fshift; 5358dec0b466SHong Zhang a->nz = ai[m]; 5359dec0b466SHong Zhang } 5360dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5361dec0b466SHong Zhang A->nonzerostate -= fshift; 5362dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5363dec0b466SHong Zhang a->rmax = rmax; 5364dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5365dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5366dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 53673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5368dec0b466SHong Zhang } 5369dec0b466SHong Zhang 53704099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 53714099cc6bSBarry Smith 53724099cc6bSBarry Smith /*@C 537311a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 53744099cc6bSBarry Smith 5375c3339decSBarry Smith Collective 53764099cc6bSBarry Smith 53774099cc6bSBarry Smith Input Parameters: 53784099cc6bSBarry Smith + mat - the matrix object 53794099cc6bSBarry Smith - matype - matrix type 53804099cc6bSBarry Smith 53814099cc6bSBarry Smith Options Database Key: 53824e187271SRichard Tran Mills . 
-mat_seqaij_type <method> - for example seqaijcrl 53834099cc6bSBarry Smith 53844099cc6bSBarry Smith Level: intermediate 53854099cc6bSBarry Smith 5386db781477SPatrick Sanan .seealso: `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat` 53874099cc6bSBarry Smith @*/ 5388d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5389d71ae5a4SJacob Faibussowitsch { 53904099cc6bSBarry Smith PetscBool sametype; 53915f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 53924099cc6bSBarry Smith 53934099cc6bSBarry Smith PetscFunctionBegin; 53944099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 53959566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 53963ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 53974099cc6bSBarry Smith 53989566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 53995f80ce2aSJacob Faibussowitsch PetscCheck(r, PETSC_COMM_SELF, PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 54009566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 54013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54024099cc6bSBarry Smith } 54034099cc6bSBarry Smith 54044099cc6bSBarry Smith /*@C 540511a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 54064099cc6bSBarry Smith 54074099cc6bSBarry Smith Not Collective 54084099cc6bSBarry Smith 54094099cc6bSBarry Smith Input Parameters: 541011a5261eSBarry Smith + name - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 54114099cc6bSBarry Smith - function - routine to convert to subtype 54124099cc6bSBarry Smith 54134099cc6bSBarry Smith Notes: 541411a5261eSBarry Smith `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 
54154099cc6bSBarry Smith 54164099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 54174099cc6bSBarry Smith $ -mat_seqaij_type my_mat 54184099cc6bSBarry Smith 54194099cc6bSBarry Smith Level: advanced 54204099cc6bSBarry Smith 5421db781477SPatrick Sanan .seealso: `MatSeqAIJRegisterAll()` 54224099cc6bSBarry Smith @*/ 5423d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5424d71ae5a4SJacob Faibussowitsch { 54254099cc6bSBarry Smith PetscFunctionBegin; 54269566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 54279566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 54283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54294099cc6bSBarry Smith } 54304099cc6bSBarry Smith 54314099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 54324099cc6bSBarry Smith 54334099cc6bSBarry Smith /*@C 543411a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 54354099cc6bSBarry Smith 54364099cc6bSBarry Smith Not Collective 54374099cc6bSBarry Smith 54384099cc6bSBarry Smith Level: advanced 54394099cc6bSBarry Smith 5440db781477SPatrick Sanan .seealso: `MatRegisterAll()`, `MatSeqAIJRegister()` 54414099cc6bSBarry Smith @*/ 5442d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5443d71ae5a4SJacob Faibussowitsch { 54444099cc6bSBarry Smith PetscFunctionBegin; 54453ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 54464099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 54474099cc6bSBarry Smith 54489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 54499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 54509566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 54519779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 54529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5453485f9817SRichard Tran Mills #endif 54545063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 54559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 54565063d097SStefano Zampini #endif 5457d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5458d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5459d5e393b6SSuyash Tandon #endif 54605063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 54619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 54625063d097SStefano Zampini #endif 54634099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 54649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 54654099cc6bSBarry Smith #endif 54663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54674099cc6bSBarry Smith } 546853dd7562SDmitry Karpeev 546953dd7562SDmitry Karpeev /* 547081824310SBarry Smith Special version for direct calls from Fortran 547181824310SBarry Smith */ 5472af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 547381824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 547481824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 547581824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 547681824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 547781824310SBarry Smith #endif 547881824310SBarry Smith 547981824310SBarry Smith /* Change these macros so can be used in void function */ 548098921bdaSJacob Faibussowitsch 548198921bdaSJacob Faibussowitsch /* Change these macros so can be used 
in void function */ 54829566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 54839566063dSJacob Faibussowitsch #undef PetscCall 54849371c9d4SSatish Balay #define PetscCall(...) \ 54859371c9d4SSatish Balay do { \ 54865f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 548798921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 548898921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 548998921bdaSJacob Faibussowitsch return; \ 549098921bdaSJacob Faibussowitsch } \ 549198921bdaSJacob Faibussowitsch } while (0) 549298921bdaSJacob Faibussowitsch 549398921bdaSJacob Faibussowitsch #undef SETERRQ 54949371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 54959371c9d4SSatish Balay do { \ 549698921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 549798921bdaSJacob Faibussowitsch return; \ 549898921bdaSJacob Faibussowitsch } while (0) 549981824310SBarry Smith 5500d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5501d71ae5a4SJacob Faibussowitsch { 550281824310SBarry Smith Mat A = *AA; 550381824310SBarry Smith PetscInt m = *mm, n = *nn; 550481824310SBarry Smith InsertMode is = *isis; 550581824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 550681824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 550781824310SBarry Smith PetscInt *imax, *ai, *ailen; 550881824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 550954f21887SBarry Smith MatScalar *ap, value, *aa; 5510ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5511ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 
551281824310SBarry Smith 551381824310SBarry Smith PetscFunctionBegin; 55144994cf47SJed Brown MatCheckPreallocated(A, 1); 551581824310SBarry Smith imax = a->imax; 551681824310SBarry Smith ai = a->i; 551781824310SBarry Smith ailen = a->ilen; 551881824310SBarry Smith aj = a->j; 551981824310SBarry Smith aa = a->a; 552081824310SBarry Smith 552181824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 552281824310SBarry Smith row = im[k]; 552381824310SBarry Smith if (row < 0) continue; 55245f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 55259371c9d4SSatish Balay rp = aj + ai[row]; 55269371c9d4SSatish Balay ap = aa + ai[row]; 55279371c9d4SSatish Balay rmax = imax[row]; 55289371c9d4SSatish Balay nrow = ailen[row]; 552981824310SBarry Smith low = 0; 553081824310SBarry Smith high = nrow; 553181824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 553281824310SBarry Smith if (in[l] < 0) continue; 55335f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 553481824310SBarry Smith col = in[l]; 55352205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 55362205254eSKarl Rupp else value = v[k + l * m]; 55372205254eSKarl Rupp 553881824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 553981824310SBarry Smith 55402205254eSKarl Rupp if (col <= lastcol) low = 0; 55412205254eSKarl Rupp else high = nrow; 554281824310SBarry Smith lastcol = col; 554381824310SBarry Smith while (high - low > 5) { 554481824310SBarry Smith t = (low + high) / 2; 554581824310SBarry Smith if (rp[t] > col) high = t; 554681824310SBarry Smith else low = t; 554781824310SBarry Smith } 554881824310SBarry Smith for (i = low; i < high; i++) { 554981824310SBarry Smith if (rp[i] > col) break; 555081824310SBarry Smith if (rp[i] == col) { 555181824310SBarry Smith if (is == 
ADD_VALUES) ap[i] += value; 555281824310SBarry Smith else ap[i] = value; 555381824310SBarry Smith goto noinsert; 555481824310SBarry Smith } 555581824310SBarry Smith } 555681824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 555781824310SBarry Smith if (nonew == 1) goto noinsert; 55585f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5559fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 55609371c9d4SSatish Balay N = nrow++ - 1; 55619371c9d4SSatish Balay a->nz++; 55629371c9d4SSatish Balay high++; 556381824310SBarry Smith /* shift up all the later entries in this row */ 556481824310SBarry Smith for (ii = N; ii >= i; ii--) { 556581824310SBarry Smith rp[ii + 1] = rp[ii]; 556681824310SBarry Smith ap[ii + 1] = ap[ii]; 556781824310SBarry Smith } 556881824310SBarry Smith rp[i] = col; 556981824310SBarry Smith ap[i] = value; 5570e56f5c9eSBarry Smith A->nonzerostate++; 557181824310SBarry Smith noinsert:; 557281824310SBarry Smith low = i + 1; 557381824310SBarry Smith } 557481824310SBarry Smith ailen[row] = nrow; 557581824310SBarry Smith } 557681824310SBarry Smith PetscFunctionReturnVoid(); 557781824310SBarry Smith } 557898921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 557998921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 558098921bdaSJacob Faibussowitsch * original definitions */ 55819566063dSJacob Faibussowitsch #undef PetscCall 558298921bdaSJacob Faibussowitsch #undef SETERRQ 5583