1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 20d71ae5a4SJacob Faibussowitsch { 214099cc6bSBarry Smith PetscBool flg; 224099cc6bSBarry Smith char type[256]; 234099cc6bSBarry Smith 244099cc6bSBarry Smith PetscFunctionBegin; 25d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 279566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 28d0609cedSBarry Smith PetscOptionsEnd(); 293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 304099cc6bSBarry Smith } 314099cc6bSBarry Smith 32d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 33d71ae5a4SJacob Faibussowitsch { 340716a85fSBarry Smith PetscInt i, m, n; 350716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 360716a85fSBarry Smith 370716a85fSBarry Smith PetscFunctionBegin; 389566063dSJacob Faibussowitsch 
PetscCall(MatGetSize(A, &m, &n)); 399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 400716a85fSBarry Smith if (type == NORM_2) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 420716a85fSBarry Smith } else if (type == NORM_1) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_INFINITY) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 50857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 53a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 54857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 560716a85fSBarry Smith } 573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 580716a85fSBarry Smith } 590716a85fSBarry Smith 60d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 61d71ae5a4SJacob Faibussowitsch { 623a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 633a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 643a062f41SBarry Smith const PetscInt 
*jj = a->j, *ii = a->i; 653a062f41SBarry Smith PetscInt *rows; 663a062f41SBarry Smith 673a062f41SBarry Smith PetscFunctionBegin; 683a062f41SBarry Smith for (i = 0; i < m; i++) { 69ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i = 0; i < m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 799566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 84d71ae5a4SJacob Faibussowitsch { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 86fff043a9SJunchao Zhang const MatScalar *aa; 876ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith 916ce1633cSBarry Smith PetscFunctionBegin; 929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 939566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i = 0; i < m; i++) { 96ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 976ce1633cSBarry Smith } 989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 996ce1633cSBarry Smith cnt = 0; 1006ce1633cSBarry Smith for (i = 0; i < m; i++) { 
101ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1026ce1633cSBarry Smith } 103f1f41ecbSJed Brown *nrows = cnt; 104f1f41ecbSJed Brown *zrows = rows; 1059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107f1f41ecbSJed Brown } 108f1f41ecbSJed Brown 109d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 110d71ae5a4SJacob Faibussowitsch { 111f1f41ecbSJed Brown PetscInt nrows, *rows; 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscFunctionBegin; 1140298fd71SBarry Smith *zrows = NULL; 1159566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1169566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1186ce1633cSBarry Smith } 1196ce1633cSBarry Smith 120d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 121d71ae5a4SJacob Faibussowitsch { 122b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 123b3a44c85SBarry Smith const MatScalar *aa; 124b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 125b3a44c85SBarry Smith const PetscInt *ii; 126b3a44c85SBarry Smith PetscInt n, i, j, *rows; 127b3a44c85SBarry Smith 128b3a44c85SBarry Smith PetscFunctionBegin; 1299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 130f4259b30SLisandro Dalcin *keptrows = NULL; 131b3a44c85SBarry Smith ii = a->i; 132b3a44c85SBarry Smith for (i = 0; i < m; i++) { 133b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 134b3a44c85SBarry Smith if (!n) { 135b3a44c85SBarry Smith cnt++; 136b3a44c85SBarry Smith goto ok1; 137b3a44c85SBarry Smith } 1382e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 139b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 
140b3a44c85SBarry Smith } 141b3a44c85SBarry Smith cnt++; 142b3a44c85SBarry Smith ok1:; 143b3a44c85SBarry Smith } 1442e5835c6SStefano Zampini if (!cnt) { 1459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1472e5835c6SStefano Zampini } 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 149b3a44c85SBarry Smith cnt = 0; 150b3a44c85SBarry Smith for (i = 0; i < m; i++) { 151b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 152b3a44c85SBarry Smith if (!n) continue; 1532e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 154b3a44c85SBarry Smith if (aa[j] != 0.0) { 155b3a44c85SBarry Smith rows[cnt++] = i; 156b3a44c85SBarry Smith break; 157b3a44c85SBarry Smith } 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 1609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1619566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith 165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 166d71ae5a4SJacob Faibussowitsch { 16779299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172ace3abfcSBarry Smith PetscBool missing; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 1769566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 17709f38230SBarry Smith if (!missing) { 17879299369SBarry Smith diag = aij->diag; 1799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 1809566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJGetArray(Y, &aa)); 18179299369SBarry Smith if (is == INSERT_VALUES) { 182ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18379299369SBarry Smith } else { 184ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18579299369SBarry Smith } 1869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18979299369SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 19109f38230SBarry Smith } 1929566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19409f38230SBarry Smith } 19579299369SBarry Smith 196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 197d71ae5a4SJacob Faibussowitsch { 198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19997f1f81fSBarry Smith PetscInt i, ishift; 20017ab2063SBarry Smith 2013a40ed3dSBarry Smith PetscFunctionBegin; 202f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2033ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 204bfeeae90SHong Zhang ishift = 0; 205b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2069566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 207bfeeae90SHong Zhang } else if (oshift == 1) { 2081a83f524SJed Brown PetscInt *tia; 209d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2103b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 2121a83f524SJed Brown for (i = 0; i < 
A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2131a83f524SJed Brown *ia = tia; 214ecc77c7aSBarry Smith if (ja) { 2151a83f524SJed Brown PetscInt *tja; 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob Faibussowitsch if (!ia) 
PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2813ba16761SJacob 
Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] 
- a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 
348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 
381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " 
max %" PetscInt_FMT, row, A->rmap->n - 1); 418720833daSHong Zhang rp = aj + ai[row]; 419876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 453c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, 
PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e56f5c9eSBarry Smith A->nonzerostate++; 472e44c0bd4SBarry Smith noinsert:; 47317ab2063SBarry Smith } 47417ab2063SBarry Smith ailen[row] = nrow; 47517ab2063SBarry Smith } 4769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47817ab2063SBarry Smith } 47917ab2063SBarry Smith 480d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 481d71ae5a4SJacob Faibussowitsch { 48219b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48319b08ed1SBarry Smith PetscInt *rp, k, row; 48419b08ed1SBarry Smith PetscInt *ai = a->i; 48519b08ed1SBarry Smith PetscInt *aj = a->j; 486fff043a9SJunchao Zhang MatScalar *aa, *ap; 48719b08ed1SBarry Smith 48819b08ed1SBarry Smith PetscFunctionBegin; 
48928b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 49008401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 491fff043a9SJunchao Zhang 4929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49319b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49419b08ed1SBarry Smith row = im[k]; 49519b08ed1SBarry Smith rp = aj + ai[row]; 49619b08ed1SBarry Smith ap = aa + ai[row]; 49719b08ed1SBarry Smith 4989566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49919b08ed1SBarry Smith if (!A->structure_only) { 50019b08ed1SBarry Smith if (v) { 5019566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 50219b08ed1SBarry Smith v += n; 50319b08ed1SBarry Smith } else { 5049566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith a->ilen[row] = n; 50819b08ed1SBarry Smith a->imax[row] = n; 50919b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 51019b08ed1SBarry Smith a->nz += n; 51119b08ed1SBarry Smith } 5129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51419b08ed1SBarry Smith } 51519b08ed1SBarry Smith 51619b08ed1SBarry Smith /*@ 51719b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 
51819b08ed1SBarry Smith 51919b08ed1SBarry Smith Input Parameters: 52011a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52119b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52219b08ed1SBarry Smith 52319b08ed1SBarry Smith Level: advanced 52419b08ed1SBarry Smith 52519b08ed1SBarry Smith Notes: 52619b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52711a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52819b08ed1SBarry Smith as always with multiple matrix assemblies. 52919b08ed1SBarry Smith 5301cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53119b08ed1SBarry Smith @*/ 53219b08ed1SBarry Smith 533d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 534d71ae5a4SJacob Faibussowitsch { 53519b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53619b08ed1SBarry Smith 53719b08ed1SBarry Smith PetscFunctionBegin; 5389566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5399566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 54019b08ed1SBarry Smith a->maxnz = nztotal; 5414dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 54219b08ed1SBarry Smith if (!a->ilen) { 5439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54419b08ed1SBarry Smith } else { 5459566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54619b08ed1SBarry Smith } 54719b08ed1SBarry Smith 54819b08ed1SBarry Smith /* allocate the matrix space */ 54919b08ed1SBarry Smith if (A->structure_only) { 5509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 
55219b08ed1SBarry Smith } else { 5539566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 55419b08ed1SBarry Smith } 55519b08ed1SBarry Smith a->i[0] = 0; 55619b08ed1SBarry Smith if (A->structure_only) { 55719b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55819b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55919b08ed1SBarry Smith } else { 56019b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 56119b08ed1SBarry Smith a->free_a = PETSC_TRUE; 56219b08ed1SBarry Smith } 56319b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 56419b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 56519b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56719b08ed1SBarry Smith } 56819b08ed1SBarry Smith 569d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 570d71ae5a4SJacob Faibussowitsch { 571071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 572071fcb05SBarry Smith PetscInt *rp, k, row; 573071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 574071fcb05SBarry Smith PetscInt *aj = a->j; 575fff043a9SJunchao Zhang MatScalar *aa, *ap; 576071fcb05SBarry Smith 577071fcb05SBarry Smith PetscFunctionBegin; 5789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 579071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 580071fcb05SBarry Smith row = im[k]; 5816bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 582071fcb05SBarry Smith rp = aj + ai[row]; 583071fcb05SBarry Smith ap = aa + ai[row]; 58448a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 585071fcb05SBarry Smith if (!A->structure_only) { 
586071fcb05SBarry Smith if (v) { 5879566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 588071fcb05SBarry Smith v += n; 589071fcb05SBarry Smith } else { 5909566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 591071fcb05SBarry Smith } 592071fcb05SBarry Smith } 593071fcb05SBarry Smith ailen[row] = n; 594071fcb05SBarry Smith a->nz += n; 595071fcb05SBarry Smith } 5969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 598071fcb05SBarry Smith } 599071fcb05SBarry Smith 600d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 601d71ae5a4SJacob Faibussowitsch { 6027eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 60397f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 60497f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 6054e208921SJed Brown const MatScalar *ap, *aa; 6067eb43aa7SLois Curfman McInnes 6073a40ed3dSBarry Smith PetscFunctionBegin; 6084e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6097eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6107eb43aa7SLois Curfman McInnes row = im[k]; 6119371c9d4SSatish Balay if (row < 0) { 6129371c9d4SSatish Balay v += n; 6139371c9d4SSatish Balay continue; 6149371c9d4SSatish Balay } /* negative row */ 61554c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6169371c9d4SSatish Balay rp = aj + ai[row]; 6179371c9d4SSatish Balay ap = aa + ai[row]; 6187eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6197eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6209371c9d4SSatish Balay if (in[l] < 0) { 6219371c9d4SSatish Balay v++; 
6229371c9d4SSatish Balay continue; 6239371c9d4SSatish Balay } /* negative column */ 62454c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 625bfeeae90SHong Zhang col = in[l]; 6269371c9d4SSatish Balay high = nrow; 6279371c9d4SSatish Balay low = 0; /* assume unsorted */ 6287eb43aa7SLois Curfman McInnes while (high - low > 5) { 6297eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6307eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6317eb43aa7SLois Curfman McInnes else low = t; 6327eb43aa7SLois Curfman McInnes } 6337eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6347eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6357eb43aa7SLois Curfman McInnes if (rp[i] == col) { 636b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6377eb43aa7SLois Curfman McInnes goto finished; 6387eb43aa7SLois Curfman McInnes } 6397eb43aa7SLois Curfman McInnes } 64097e567efSBarry Smith *v++ = 0.0; 6417eb43aa7SLois Curfman McInnes finished:; 6427eb43aa7SLois Curfman McInnes } 6437eb43aa7SLois Curfman McInnes } 6444e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6467eb43aa7SLois Curfman McInnes } 6477eb43aa7SLois Curfman McInnes 648d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 649d71ae5a4SJacob Faibussowitsch { 6503ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 651c898d852SStefano Zampini const PetscScalar *av; 6523ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6533ea6fe3dSLisandro Dalcin PetscInt *rowlens; 65417ab2063SBarry Smith 6553a40ed3dSBarry Smith PetscFunctionBegin; 6569566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6572205254eSKarl Rupp 6583ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6593ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6603ea6fe3dSLisandro 
Dalcin m = mat->rmap->n; 6613ea6fe3dSLisandro Dalcin nz = A->nz; 662416022c9SBarry Smith 6633ea6fe3dSLisandro Dalcin /* write matrix header */ 6643ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6659371c9d4SSatish Balay header[1] = M; 6669371c9d4SSatish Balay header[2] = N; 6679371c9d4SSatish Balay header[3] = nz; 6689566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 669416022c9SBarry Smith 6703ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6723ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6739566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6749566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6753ea6fe3dSLisandro Dalcin /* store column indices */ 6769566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 677416022c9SBarry Smith /* store nonzero values */ 6789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6799566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 681b37d52dbSMark F. 
Adams 6823ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6839566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 68517ab2063SBarry Smith } 686416022c9SBarry Smith 687d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 688d71ae5a4SJacob Faibussowitsch { 6897dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6907dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6917dc0baabSHong Zhang 6927dc0baabSHong Zhang PetscFunctionBegin; 6939566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6947dc0baabSHong Zhang for (i = 0; i < m; i++) { 6959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 69648a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6987dc0baabSHong Zhang } 6999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 7003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7017dc0baabSHong Zhang } 7027dc0baabSHong Zhang 70309573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 704cd155464SBarry Smith 705d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 706d71ae5a4SJacob Faibussowitsch { 707416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 708c898d852SStefano Zampini const PetscScalar *av; 70960e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 710e060cb09SBarry Smith const char *name; 711f3ef73ceSBarry Smith PetscViewerFormat format; 71217ab2063SBarry Smith 7133a40ed3dSBarry Smith PetscFunctionBegin; 7147dc0baabSHong Zhang if (A->structure_only) { 7159566063dSJacob Faibussowitsch 
PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7177dc0baabSHong Zhang } 71843e49210SHong Zhang 7199566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7203ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 7212e5835c6SStefano Zampini 722c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 72571c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 72697f1f81fSBarry Smith PetscInt nofinalvalue = 0; 72760e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 728c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 729d00d2cf4SBarry Smith nofinalvalue = 1; 730d00d2cf4SBarry Smith } 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 734fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 736fbfe6fa7SJed Brown #else 7379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 738fbfe6fa7SJed Brown #endif 7399566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 74017ab2063SBarry Smith 74117ab2063SBarry Smith for (i = 0; i < m; i++) { 74260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 743aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 74517ab2063SBarry Smith #else 7469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 74717ab2063SBarry Smith #endif 74817ab2063SBarry Smith } 74917ab2063SBarry Smith } 750d00d2cf4SBarry Smith if (nofinalvalue) { 751c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 753c337ccceSJed Brown #else 7549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 755c337ccceSJed Brown #endif 756d00d2cf4SBarry Smith } 7579566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 760fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 76244cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 76460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 765aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76836db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 77036db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7726831982aSBarry Smith } 77344cd7ae7SLois Curfman McInnes #else 7749566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 77544cd7ae7SLois Curfman McInnes #endif 77644cd7ae7SLois Curfman McInnes } 7779566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77844cd7ae7SLois 
Curfman McInnes } 7799566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 780fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 78197f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7839566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 784496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 785496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 78660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 787496be53dSLois Curfman McInnes if (a->j[j] >= i) { 788aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78936db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 790496be53dSLois Curfman McInnes #else 791496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 792496be53dSLois Curfman McInnes #endif 793496be53dSLois Curfman McInnes } 794496be53dSLois Curfman McInnes } 795496be53dSLois Curfman McInnes } 7962e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7982e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7992205254eSKarl Rupp if (i + 4 < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 8012205254eSKarl Rupp } else if (i + 3 < m) { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 8032205254eSKarl Rupp } else if (i + 2 < m) { 8049566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 8052205254eSKarl Rupp } else if (i + 1 < m) { 8069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 8072205254eSKarl Rupp } else if (i < m) { 8089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8092205254eSKarl Rupp } else { 8109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8112205254eSKarl Rupp } 812496be53dSLois Curfman McInnes } 8139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8149566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 815496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8179566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 818496be53dSLois Curfman McInnes } 8199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 820496be53dSLois Curfman McInnes } 8219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 822496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 82360e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 824496be53dSLois Curfman McInnes if (a->j[j] >= i) { 825aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 82648a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 827496be53dSLois Curfman McInnes #else 8289566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
829496be53dSLois Curfman McInnes #endif 830496be53dSLois Curfman McInnes } 831496be53dSLois Curfman McInnes } 8329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 833496be53dSLois Curfman McInnes } 8349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 835fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 83697f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 83787828ca2SBarry Smith PetscScalar value; 83868f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83968f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 84068f1ed48SBarry Smith 84168f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 84268f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 84368f1ed48SBarry Smith realonly = PETSC_FALSE; 84468f1ed48SBarry Smith break; 84568f1ed48SBarry Smith } 84668f1ed48SBarry Smith } 84768f1ed48SBarry Smith #endif 84802594712SBarry Smith 8499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 85002594712SBarry Smith for (i = 0; i < m; i++) { 85102594712SBarry Smith jcnt = 0; 852d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 853e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 85402594712SBarry Smith value = a->a[cnt++]; 855e24b481bSBarry Smith jcnt++; 85602594712SBarry Smith } else { 85702594712SBarry Smith value = 0.0; 85802594712SBarry Smith } 859aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 86068f1ed48SBarry Smith if (realonly) { 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 86268f1ed48SBarry Smith } else { 8639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 86468f1ed48SBarry Smith } 86502594712SBarry Smith #else 8669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 86702594712SBarry Smith 
#endif 86802594712SBarry Smith } 8699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 87002594712SBarry Smith } 8719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8723c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 873150b93efSMatthew G. Knepley PetscInt fshift = 1; 8749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8773c215bfdSMatthew Knepley #else 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8793c215bfdSMatthew Knepley #endif 8809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8813c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 88260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8833c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8853c215bfdSMatthew Knepley #else 8869566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8873c215bfdSMatthew Knepley #endif 8883c215bfdSMatthew Knepley } 8893c215bfdSMatthew Knepley } 8909566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8913a40ed3dSBarry Smith } else { 8929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 893d5f3da31SBarry Smith if (A->factortype) { 89416cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 89616cd7e1dSShri Abhyankar /* L part */ 89760e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 90116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 90316cd7e1dSShri Abhyankar } else { 9049566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 90516cd7e1dSShri Abhyankar } 90616cd7e1dSShri Abhyankar #else 9079566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90816cd7e1dSShri Abhyankar #endif 90916cd7e1dSShri Abhyankar } 91016cd7e1dSShri Abhyankar /* diagonal */ 91116cd7e1dSShri Abhyankar j = a->diag[i]; 91216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91316cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 91516cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9169566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 91716cd7e1dSShri Abhyankar } else { 9189566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91916cd7e1dSShri Abhyankar } 92016cd7e1dSShri Abhyankar #else 9219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 92216cd7e1dSShri Abhyankar #endif 92316cd7e1dSShri Abhyankar 92416cd7e1dSShri Abhyankar /* U part */ 92560e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 92616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 92716cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9289566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92916cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 93116cd7e1dSShri Abhyankar } else { 9329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 93316cd7e1dSShri Abhyankar } 93416cd7e1dSShri Abhyankar #else 9359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 93616cd7e1dSShri Abhyankar #endif 93716cd7e1dSShri Abhyankar } 9389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93916cd7e1dSShri Abhyankar } 94016cd7e1dSShri Abhyankar } else { 94117ab2063SBarry Smith for (i = 0; i < m; i++) { 9429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 94360e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 944aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 94536db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94736db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9493a40ed3dSBarry Smith } else { 9509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 95117ab2063SBarry Smith } 95217ab2063SBarry Smith #else 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 95417ab2063SBarry Smith #endif 95517ab2063SBarry Smith } 9569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95717ab2063SBarry Smith } 95816cd7e1dSShri Abhyankar } 9599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 96017ab2063SBarry Smith } 9619566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 963416022c9SBarry Smith } 964416022c9SBarry Smith 9659804daf3SBarry Smith #include <petscdraw.h> 966d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 967d71ae5a4SJacob Faibussowitsch { 968480ef9eaSBarry Smith Mat A = (Mat)Aa; 969416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 970383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 971383922c3SLisandro Dalcin int color; 972b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 973b0a32e0cSBarry Smith PetscViewer viewer; 974f3ef73ceSBarry Smith PetscViewerFormat format; 975fff043a9SJunchao Zhang const PetscScalar *aa; 976cddf8d76SBarry Smith 9773a40ed3dSBarry 
Smith PetscFunctionBegin; 9789566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9799566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9809566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 981383922c3SLisandro Dalcin 982416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 984fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 985d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9860513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 987b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 988416022c9SBarry Smith for (i = 0; i < m; i++) { 9899371c9d4SSatish Balay y_l = m - i - 1.0; 9909371c9d4SSatish Balay y_r = y_l + 1.0; 991bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9929371c9d4SSatish Balay x_l = a->j[j]; 9939371c9d4SSatish Balay x_r = x_l + 1.0; 994fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9959566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 996cddf8d76SBarry Smith } 997cddf8d76SBarry Smith } 998b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 999cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10009371c9d4SSatish Balay y_l = m - i - 1.0; 10019371c9d4SSatish Balay y_r = y_l + 1.0; 1002bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10039371c9d4SSatish Balay x_l = a->j[j]; 10049371c9d4SSatish Balay x_r = x_l + 1.0; 1005fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 10069566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1007cddf8d76SBarry Smith } 1008cddf8d76SBarry Smith } 1009b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1010cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10119371c9d4SSatish Balay y_l = m - i - 1.0; 10129371c9d4SSatish Balay y_r = y_l + 1.0; 1013bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10149371c9d4SSatish Balay x_l = a->j[j]; 10159371c9d4SSatish Balay x_r = x_l + 1.0; 1016fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10179566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1018416022c9SBarry Smith } 1019416022c9SBarry Smith } 1020d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10210513a670SBarry Smith } else { 10220513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10230513a670SBarry Smith /* first determine max of all nonzero values */ 1024b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1025383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1026b0a32e0cSBarry Smith PetscDraw popup; 10270513a670SBarry Smith 10280513a670SBarry Smith for (i = 0; i < nz; i++) { 1029fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10300513a670SBarry Smith } 1031383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10329566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10339566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1034383922c3SLisandro Dalcin 1035d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10360513a670SBarry Smith for (i = 0; i < m; i++) { 1037383922c3SLisandro Dalcin y_l = m - i - 1.0; 1038383922c3SLisandro Dalcin y_r = y_l + 1.0; 1039bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1040383922c3SLisandro Dalcin x_l = a->j[j]; 1041383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1042fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10439566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10440513a670SBarry Smith count++; 10450513a670SBarry Smith } 10460513a670SBarry Smith } 1047d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10480513a670SBarry Smith } 10499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1051480ef9eaSBarry Smith } 1052cddf8d76SBarry Smith 10539804daf3SBarry Smith #include <petscdraw.h> 1054d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1055d71ae5a4SJacob Faibussowitsch { 1056b0a32e0cSBarry Smith PetscDraw draw; 105736db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1058ace3abfcSBarry Smith PetscBool isnull; 1059480ef9eaSBarry Smith 1060480ef9eaSBarry Smith PetscFunctionBegin; 10619566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10629566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10633ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1064480ef9eaSBarry Smith 10659371c9d4SSatish Balay xr = A->cmap->n; 10669371c9d4SSatish Balay yr = A->rmap->n; 10679371c9d4SSatish Balay h = yr / 10.0; 10689371c9d4SSatish Balay w = xr / 10.0; 10699371c9d4SSatish Balay xr += w; 10709371c9d4SSatish Balay yr += h; 10719371c9d4SSatish Balay xl = -w; 10729371c9d4SSatish Balay yl = -h; 10739566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10749566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10759566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10769566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10779566063dSJacob Faibussowitsch 
PetscCall(PetscDrawSave(draw)); 10783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1079416022c9SBarry Smith } 1080416022c9SBarry Smith 1081d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1082d71ae5a4SJacob Faibussowitsch { 1083ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1084416022c9SBarry Smith 10853a40ed3dSBarry Smith PetscFunctionBegin; 10869566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10889566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10891baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10901baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10911baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10929566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109417ab2063SBarry Smith } 109519bcc07fSBarry Smith 1096d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1097d71ae5a4SJacob Faibussowitsch { 1098416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1099580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1100d0f46423SBarry Smith PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0; 110154f21887SBarry Smith MatScalar *aa = a->a, *ap; 11023447b6efSHong Zhang PetscReal ratio = 0.6; 110317ab2063SBarry Smith 11043a40ed3dSBarry Smith PetscFunctionBegin; 11053ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 11069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1107b215bc84SStefano Zampini if (A->was_assembled && 
A->ass_nonzerostate == A->nonzerostate) { 1108b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11099566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1111b215bc84SStefano Zampini } 111217ab2063SBarry Smith 111343ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 111417ab2063SBarry Smith for (i = 1; i < m; i++) { 1115416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 111617ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111794a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111817ab2063SBarry Smith if (fshift) { 1119bfeeae90SHong Zhang ip = aj + ai[i]; 1120bfeeae90SHong Zhang ap = aa + ai[i]; 112117ab2063SBarry Smith N = ailen[i]; 11229566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 112348a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 112417ab2063SBarry Smith } 112517ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112617ab2063SBarry Smith } 112717ab2063SBarry Smith if (m) { 112817ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112917ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 113017ab2063SBarry Smith } 113117ab2063SBarry Smith /* reset ilen and imax for each row */ 11327b083b7cSBarry Smith a->nonzerorowcnt = 0; 1133396832f4SHong Zhang if (A->structure_only) { 11349566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11359566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1136396832f4SHong Zhang } else { /* !A->structure_only */ 113717ab2063SBarry Smith for (i = 0; i < m; i++) { 113817ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11397b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 114017ab2063SBarry Smith } 1141396832f4SHong Zhang } 1142bfeeae90SHong Zhang a->nz = 
ai[m]; 1143aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 114417ab2063SBarry Smith 11459566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11469566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11479566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11489566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11492205254eSKarl Rupp 11508e58a170SBarry Smith A->info.mallocs += a->reallocs; 1151dd5f02e7SSatish Balay a->reallocs = 0; 11526712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 115336db0b34SBarry Smith a->rmax = rmax; 11544e220ebcSLois Curfman McInnes 115548a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11569566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 115817ab2063SBarry Smith } 115917ab2063SBarry Smith 1160d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1161d71ae5a4SJacob Faibussowitsch { 116299cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116399cafbc1SBarry Smith PetscInt i, nz = a->nz; 11642e5835c6SStefano Zampini MatScalar *aa; 116599cafbc1SBarry Smith 116699cafbc1SBarry Smith PetscFunctionBegin; 11679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116899cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11709566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 117299cafbc1SBarry Smith } 117399cafbc1SBarry Smith 1174d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1175d71ae5a4SJacob Faibussowitsch { 117699cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 117799cafbc1SBarry Smith PetscInt i, nz = a->nz; 11782e5835c6SStefano Zampini MatScalar *aa; 117999cafbc1SBarry Smith 118099cafbc1SBarry Smith PetscFunctionBegin; 11819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 118299cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 118699cafbc1SBarry Smith } 118799cafbc1SBarry Smith 1188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1189d71ae5a4SJacob Faibussowitsch { 1190fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1191fff043a9SJunchao Zhang MatScalar *aa; 11923a40ed3dSBarry Smith 11933a40ed3dSBarry Smith PetscFunctionBegin; 11949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11959566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119917ab2063SBarry Smith } 1200416022c9SBarry Smith 1201d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1202d71ae5a4SJacob Faibussowitsch { 1203cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1204cbc6b225SStefano Zampini 1205cbc6b225SStefano Zampini PetscFunctionBegin; 12069566063dSJacob 
Faibussowitsch PetscCall(PetscFree(a->perm)); 12079566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 12083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1209cbc6b225SStefano Zampini } 1210cbc6b225SStefano Zampini 1211d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1212d71ae5a4SJacob Faibussowitsch { 1213416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1214d5d45c9bSBarry Smith 12153a40ed3dSBarry Smith PetscFunctionBegin; 1216*b4e2f619SBarry Smith if (A->hash_active) { 1217*b4e2f619SBarry Smith PetscCall(PetscMemcpy(&A->ops, &a->cops, sizeof(*(A->ops)))); 1218*b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 1219*b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 1220*b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 1221*b4e2f619SBarry Smith } 1222*b4e2f619SBarry Smith 1223aa482453SBarry Smith #if defined(PETSC_USE_LOG) 12243ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 122517ab2063SBarry Smith #endif 12269566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12279566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12289566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12299566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12309566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12319566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12329566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12339566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12349566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12359566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12369566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12379566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12389566063dSJacob 
Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12399566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12409566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12419566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1242901853e0SKris Buschelman 12436718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12446718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12456718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12466718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12476718818eSStefano Zampini due to different matrix sizes */ 12489566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12496718818eSStefano Zampini 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12512e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12522e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12589566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12592e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12602e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12612e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12622e956fe4SStefano Zampini #endif 12634222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12674222ddf1SHong Zhang #endif 1268d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1269d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1270d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1271d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1272d5e393b6SSuyash Tandon #endif 12733d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12753d0639e7SStefano Zampini #endif 12769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1277af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 
1279af8000cdSHong Zhang #endif 1280d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1282d24d4204SJose E. Roman #endif 128363c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 128663c07aadSStefano Zampini #endif 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12912e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL)); 13009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 13019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 13022e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 13032e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 13042e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 13052e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 13062e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 13072e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 13082e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 13093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 131017ab2063SBarry Smith } 131117ab2063SBarry Smith 1312d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1313d71ae5a4SJacob Faibussowitsch { 1314416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13153a40ed3dSBarry Smith 13163a40ed3dSBarry Smith PetscFunctionBegin; 1317a65d3064SKris Buschelman switch (op) { 1318d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1319d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 
1320d71ae5a4SJacob Faibussowitsch break; 1321d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1322d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1323d71ae5a4SJacob Faibussowitsch break; 1324d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1325d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1326d71ae5a4SJacob Faibussowitsch break; 1327d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1328d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1329d71ae5a4SJacob Faibussowitsch break; 1330d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1331d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1332d71ae5a4SJacob Faibussowitsch break; 1333d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1334d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1335d71ae5a4SJacob Faibussowitsch break; 1336d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1337d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1338d71ae5a4SJacob Faibussowitsch break; 13393d472b54SHong Zhang case MAT_SPD: 1340b1646e73SJed Brown case MAT_SYMMETRIC: 1341b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1342b1646e73SJed Brown case MAT_HERMITIAN: 1343b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1344957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1345b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1346b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1347b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13485021d80fSJed Brown break; 13498c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1350a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1351d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1352d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1353d71ae5a4SJacob Faibussowitsch break; 1354d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1355d71ae5a4SJacob Faibussowitsch 
PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1356d71ae5a4SJacob Faibussowitsch break; 1357d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1358d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1359d71ae5a4SJacob Faibussowitsch break; 1360071fcb05SBarry Smith case MAT_SORTED_FULL: 1361071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1362071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1363071fcb05SBarry Smith break; 1364d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1365d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1366d71ae5a4SJacob Faibussowitsch break; 1367d71ae5a4SJacob Faibussowitsch default: 1368d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1369a65d3064SKris Buschelman } 13703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 137117ab2063SBarry Smith } 137217ab2063SBarry Smith 1373d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1374d71ae5a4SJacob Faibussowitsch { 1375416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1376fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1377c898d852SStefano Zampini PetscScalar *x; 1378c898d852SStefano Zampini const PetscScalar *aa; 137917ab2063SBarry Smith 13803a40ed3dSBarry Smith PetscFunctionBegin; 13819566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 138208401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1384d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1385d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13869566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13872c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13889566063dSJacob Faibussowitsch 
PetscCall(VecRestoreArrayWrite(v, &x)); 13899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 139135e7444dSHong Zhang } 139235e7444dSHong Zhang 13939566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 139435e7444dSHong Zhang for (i = 0; i < n; i++) { 1395fdc842d1SBarry Smith x[i] = 0.0; 139635e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 139735e7444dSHong Zhang if (aj[j] == i) { 139835e7444dSHong Zhang x[i] = aa[j]; 139917ab2063SBarry Smith break; 140017ab2063SBarry Smith } 140117ab2063SBarry Smith } 140217ab2063SBarry Smith } 14039566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 14049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 140617ab2063SBarry Smith } 140717ab2063SBarry Smith 1408c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1409d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1410d71ae5a4SJacob Faibussowitsch { 1411416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 14125f22a7b3SSebastian Grimberg const MatScalar *aa; 1413d9ca1df4SBarry Smith PetscScalar *y; 1414d9ca1df4SBarry Smith const PetscScalar *x; 1415d0f46423SBarry Smith PetscInt m = A->rmap->n; 14165c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14175f22a7b3SSebastian Grimberg const MatScalar *v; 1418a77337e4SBarry Smith PetscScalar alpha; 1419d9ca1df4SBarry Smith PetscInt n, i, j; 1420d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14213447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1422ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14235c897100SBarry Smith #endif 142417ab2063SBarry Smith 14253a40ed3dSBarry Smith PetscFunctionBegin; 14269566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 
14279566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14289566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14305c897100SBarry Smith 14315c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1432fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14335c897100SBarry Smith #else 14343447b6efSHong Zhang if (usecprow) { 14353447b6efSHong Zhang m = cprow.nrows; 14363447b6efSHong Zhang ii = cprow.i; 14377b2bb3b9SHong Zhang ridx = cprow.rindex; 14383447b6efSHong Zhang } else { 14393447b6efSHong Zhang ii = a->i; 14403447b6efSHong Zhang } 144117ab2063SBarry Smith for (i = 0; i < m; i++) { 14423447b6efSHong Zhang idx = a->j + ii[i]; 1443fff043a9SJunchao Zhang v = aa + ii[i]; 14443447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14453447b6efSHong Zhang if (usecprow) { 14467b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14473447b6efSHong Zhang } else { 144817ab2063SBarry Smith alpha = x[i]; 14493447b6efSHong Zhang } 145004fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 145117ab2063SBarry Smith } 14525c897100SBarry Smith #endif 14539566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14549566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14559566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 145817ab2063SBarry Smith } 145917ab2063SBarry Smith 1460d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1461d71ae5a4SJacob Faibussowitsch { 14625c897100SBarry Smith PetscFunctionBegin; 14639566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14649566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14653ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 14665c897100SBarry Smith } 14675c897100SBarry Smith 1468c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 146978b84d54SShri Abhyankar 1470d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1471d71ae5a4SJacob Faibussowitsch { 1472416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1473d9fead3dSBarry Smith PetscScalar *y; 147454f21887SBarry Smith const PetscScalar *x; 1475fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1476003131ecSBarry Smith PetscInt m = A->rmap->n; 14770298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14787b083b7cSBarry Smith PetscInt n, i; 1479362ced78SSatish Balay PetscScalar sum; 1480ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 148117ab2063SBarry Smith 1482b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 148397952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1484fee21e36SBarry Smith #endif 1485fee21e36SBarry Smith 14863a40ed3dSBarry Smith PetscFunctionBegin; 1487b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14889566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1490b215bc84SStefano Zampini } 14919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14929566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14939566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1494416022c9SBarry Smith ii = a->i; 14954eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14969566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 149797952fefSHong Zhang m = a->compressedrow.nrows; 149897952fefSHong Zhang ii = a->compressedrow.i; 149997952fefSHong Zhang ridx = a->compressedrow.rindex; 150097952fefSHong Zhang for (i = 0; i < m; i++) { 150197952fefSHong Zhang n = ii[i + 1] - ii[i]; 150297952fefSHong Zhang aj = a->j + ii[i]; 1503fff043a9SJunchao Zhang aa 
= a_a + ii[i]; 150497952fefSHong Zhang sum = 0.0; 1505003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1506003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 150797952fefSHong Zhang y[*ridx++] = sum; 150897952fefSHong Zhang } 150997952fefSHong Zhang } else { /* do not use compressed row format */ 1510b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15113d3eaba7SBarry Smith aj = a->j; 1512fff043a9SJunchao Zhang aa = a_a; 1513b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1514b05257ddSBarry Smith #else 151517ab2063SBarry Smith for (i = 0; i < m; i++) { 1516003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1517003131ecSBarry Smith aj = a->j + ii[i]; 1518fff043a9SJunchao Zhang aa = a_a + ii[i]; 151917ab2063SBarry Smith sum = 0.0; 1520003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 152117ab2063SBarry Smith y[i] = sum; 152217ab2063SBarry Smith } 15238d195f9aSBarry Smith #endif 1524b05257ddSBarry Smith } 15259566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15269566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15279566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 153017ab2063SBarry Smith } 153117ab2063SBarry Smith 1532d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1533d71ae5a4SJacob Faibussowitsch { 1534b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1535b434eb95SMatthew G. Knepley PetscScalar *y; 1536b434eb95SMatthew G. Knepley const PetscScalar *x; 1537fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1538b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1539b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1540b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1541b434eb95SMatthew G. 
Knepley PetscScalar sum; 1542b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1543b434eb95SMatthew G. Knepley 1544b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1545b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1546b434eb95SMatthew G. Knepley #endif 1547b434eb95SMatthew G. Knepley 1548b434eb95SMatthew G. Knepley PetscFunctionBegin; 15499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15509566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15519566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1552b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1553b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1554b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1555b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1556b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1557b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1558b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1559fff043a9SJunchao Zhang aa = a_a + ii[i]; 1560b434eb95SMatthew G. Knepley sum = 0.0; 1561b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1562b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1563b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1564b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1565b434eb95SMatthew G. Knepley } 1566b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15673d3eaba7SBarry Smith ii = a->i; 1568b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1569b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1570b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1571fff043a9SJunchao Zhang aa = a_a + ii[i]; 1572b434eb95SMatthew G. Knepley sum = 0.0; 1573b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1574b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1575b434eb95SMatthew G. Knepley y[i] = sum; 1576b434eb95SMatthew G. 
Knepley } 1577b434eb95SMatthew G. Knepley } 15789566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15809566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1583b434eb95SMatthew G. Knepley } 1584b434eb95SMatthew G. Knepley 1585d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1586d71ae5a4SJacob Faibussowitsch { 1587b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1588b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1589b434eb95SMatthew G. Knepley const PetscScalar *x; 1590fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1591b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1592b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1593b434eb95SMatthew G. Knepley PetscScalar sum; 1594b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1595b434eb95SMatthew G. Knepley 1596b434eb95SMatthew G. Knepley PetscFunctionBegin; 15979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15989566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15999566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1600b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 160148a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1602b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1603b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1604b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1605b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1606b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1607b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1608fff043a9SJunchao Zhang aa = a_a + ii[i]; 1609b434eb95SMatthew G. 
Knepley sum = y[*ridx]; 1610b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1611b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1612b434eb95SMatthew G. Knepley } 1613b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16143d3eaba7SBarry Smith ii = a->i; 1615b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1616b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1617b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1618fff043a9SJunchao Zhang aa = a_a + ii[i]; 1619b434eb95SMatthew G. Knepley sum = y[i]; 1620b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1621b434eb95SMatthew G. Knepley z[i] = sum; 1622b434eb95SMatthew G. Knepley } 1623b434eb95SMatthew G. Knepley } 16249566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16259566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16269566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1629b434eb95SMatthew G. Knepley } 1630b434eb95SMatthew G. 
Knepley 1631c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1632d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1633d71ae5a4SJacob Faibussowitsch { 1634416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1635f15663dcSBarry Smith PetscScalar *y, *z; 1636f15663dcSBarry Smith const PetscScalar *x; 1637fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1638d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1639d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1640362ced78SSatish Balay PetscScalar sum; 1641ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16429ea0dfa2SSatish Balay 16433a40ed3dSBarry Smith PetscFunctionBegin; 1644b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16459566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1647b215bc84SStefano Zampini } 16489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16499566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16509566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16514eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 165248a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 165397952fefSHong Zhang m = a->compressedrow.nrows; 165497952fefSHong Zhang ii = a->compressedrow.i; 165597952fefSHong Zhang ridx = a->compressedrow.rindex; 165697952fefSHong Zhang for (i = 0; i < m; i++) { 165797952fefSHong Zhang n = ii[i + 1] - ii[i]; 165897952fefSHong Zhang aj = a->j + ii[i]; 1659fff043a9SJunchao Zhang aa = a_a + ii[i]; 166097952fefSHong Zhang sum = y[*ridx]; 1661f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 166297952fefSHong Zhang z[*ridx++] = sum; 166397952fefSHong Zhang } 166497952fefSHong Zhang } else { /* do not use compressed row format */ 16653d3eaba7SBarry Smith ii = a->i; 
1666f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16673d3eaba7SBarry Smith aj = a->j; 1668fff043a9SJunchao Zhang aa = a_a; 1669f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1670f15663dcSBarry Smith #else 167117ab2063SBarry Smith for (i = 0; i < m; i++) { 1672f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1673f15663dcSBarry Smith aj = a->j + ii[i]; 1674fff043a9SJunchao Zhang aa = a_a + ii[i]; 167517ab2063SBarry Smith sum = y[i]; 1676f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 167717ab2063SBarry Smith z[i] = sum; 167817ab2063SBarry Smith } 167902ab625aSSatish Balay #endif 1680f15663dcSBarry Smith } 16819566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16829566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16839566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 168617ab2063SBarry Smith } 168717ab2063SBarry Smith 168817ab2063SBarry Smith /* 168917ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
169017ab2063SBarry Smith */ 1691d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1692d71ae5a4SJacob Faibussowitsch { 1693416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1694d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1695c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 169617ab2063SBarry Smith 16973a40ed3dSBarry Smith PetscFunctionBegin; 169809f38230SBarry Smith if (!a->diag) { 16999566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1700c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 170109f38230SBarry Smith } 1702d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1703c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1704c0c07093SJunchao Zhang if (alreadySet) { 1705c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1706c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1707c0c07093SJunchao Zhang } 1708c0c07093SJunchao Zhang 170909f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1710bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1711bfeeae90SHong Zhang if (a->j[j] == i) { 171209f38230SBarry Smith a->diag[i] = j; 171317ab2063SBarry Smith break; 171417ab2063SBarry Smith } 171517ab2063SBarry Smith } 171617ab2063SBarry Smith } 17173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 171817ab2063SBarry Smith } 171917ab2063SBarry Smith 1720d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1721d71ae5a4SJacob Faibussowitsch { 172261ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 172361ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 172461ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 172561ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 172661ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 172761ecd0c6SBarry Smith 172861ecd0c6SBarry Smith 
PetscFunctionBegin; 172961ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17319566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 17323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 173361ecd0c6SBarry Smith } 173461ecd0c6SBarry Smith 173561ecd0c6SBarry Smith if (a->diagonaldense) { 173661ecd0c6SBarry Smith cnt = 0; 173761ecd0c6SBarry Smith } else { 17389566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 173961ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1740349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 174161ecd0c6SBarry Smith cnt++; 174261ecd0c6SBarry Smith mdiag[i] = 1; 174361ecd0c6SBarry Smith } 174461ecd0c6SBarry Smith } 174561ecd0c6SBarry Smith } 174661ecd0c6SBarry Smith if (!cnt) { 17479566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 174861ecd0c6SBarry Smith } else { 1749b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1750b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 175161ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 175261ecd0c6SBarry Smith 175361ecd0c6SBarry Smith a->a = NULL; 175461ecd0c6SBarry Smith a->j = NULL; 175561ecd0c6SBarry Smith a->i = NULL; 175661ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1757ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 175961ecd0c6SBarry Smith 176061ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 176161ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17629566063dSJacob Faibussowitsch 
PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 176348a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1764447d62f5SStefano Zampini } 17659566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17669566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 176761ecd0c6SBarry Smith if (singlemalloc) { 17689566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 176961ecd0c6SBarry Smith } else { 17709566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17719566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17729566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 177361ecd0c6SBarry Smith } 177461ecd0c6SBarry Smith } 17759566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 177661ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 17773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 177861ecd0c6SBarry Smith } 177961ecd0c6SBarry Smith 1780be5855fcSBarry Smith /* 1781be5855fcSBarry Smith Checks for missing diagonals 1782be5855fcSBarry Smith */ 1783d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1784d71ae5a4SJacob Faibussowitsch { 1785be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17867734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1787be5855fcSBarry Smith 1788be5855fcSBarry Smith PetscFunctionBegin; 178909f38230SBarry Smith *missing = PETSC_FALSE; 17907734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 179109f38230SBarry Smith *missing = PETSC_TRUE; 179209f38230SBarry Smith if (d) *d = 0; 17939566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 179409f38230SBarry Smith } else { 179501445905SHong Zhang PetscInt n; 179601445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1797f1e2ffcdSBarry Smith diag = a->diag; 179801445905SHong Zhang for (i = 0; i < n; i++) { 17997734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 180009f38230SBarry Smith *missing = PETSC_TRUE; 180109f38230SBarry Smith if (d) *d = i; 18029566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1803358d2f5dSShri Abhyankar break; 180409f38230SBarry Smith } 1805be5855fcSBarry Smith } 1806be5855fcSBarry Smith } 18073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1808be5855fcSBarry Smith } 1809be5855fcSBarry Smith 18100da83c2eSBarry Smith #include <petscblaslapack.h> 18110da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18120da83c2eSBarry Smith 18130da83c2eSBarry Smith /* 18140da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18150da83c2eSBarry Smith */ 1816d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1817d71ae5a4SJacob Faibussowitsch { 18180da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18190da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18200da83c2eSBarry Smith const PetscReal shift = 0.0; 18210da83c2eSBarry Smith PetscInt ipvt[5]; 18224e208921SJed Brown PetscCount flops = 0; 18230da83c2eSBarry Smith PetscScalar work[25], *v_work; 18240da83c2eSBarry Smith 18250da83c2eSBarry Smith PetscFunctionBegin; 18260da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 
18270da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 182808401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1829ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18309566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 183148a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18320da83c2eSBarry Smith ncnt = 0; 18330da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18340da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18359566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18360da83c2eSBarry Smith switch (bsizes[i]) { 1837d71ae5a4SJacob Faibussowitsch case 1: 1838d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1839d71ae5a4SJacob Faibussowitsch break; 18400da83c2eSBarry Smith case 2: 18419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18420da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18439566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18440da83c2eSBarry Smith break; 18450da83c2eSBarry Smith case 3: 18469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18470da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18489566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18490da83c2eSBarry Smith break; 18500da83c2eSBarry Smith case 4: 18519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18520da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 18539566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18540da83c2eSBarry Smith break; 18550da83c2eSBarry Smith case 5: 18569566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18570da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18589566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18590da83c2eSBarry Smith break; 18600da83c2eSBarry Smith case 6: 18619566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18620da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18639566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18640da83c2eSBarry Smith break; 18650da83c2eSBarry Smith case 7: 18669566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18670da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18689566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18690da83c2eSBarry Smith break; 18700da83c2eSBarry Smith default: 18719566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18720da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18739566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18740da83c2eSBarry Smith } 18750da83c2eSBarry Smith ncnt += bsizes[i]; 18760da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 18774e208921SJed Brown flops += 2 * PetscPowInt(bsizes[i], 3) / 3; 18780da83c2eSBarry Smith } 18793ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 188048a46eb9SPierre Jolivet if (bsizemax > 7) 
PetscCall(PetscFree2(v_work, v_pivots)); 18819566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18830da83c2eSBarry Smith } 18840da83c2eSBarry Smith 1885422a814eSBarry Smith /* 1886422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1887422a814eSBarry Smith */ 1888d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1889d71ae5a4SJacob Faibussowitsch { 189071f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1891d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18922e5835c6SStefano Zampini const MatScalar *v; 189354f21887SBarry Smith PetscScalar *idiag, *mdiag; 189471f1c65dSBarry Smith 189571f1c65dSBarry Smith PetscFunctionBegin; 18963ba16761SJacob Faibussowitsch if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS); 18979566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 189871f1c65dSBarry Smith diag = a->diag; 18994dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 19002e5835c6SStefano Zampini 190171f1c65dSBarry Smith mdiag = a->mdiag; 190271f1c65dSBarry Smith idiag = a->idiag; 19039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1904422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 190571f1c65dSBarry Smith for (i = 0; i < m; i++) { 190671f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1907899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1908899639b0SHong Zhang if (PetscRealPart(fshift)) { 19099566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 19107b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19117b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19127b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 
191398921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1914899639b0SHong Zhang } 191571f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 191671f1c65dSBarry Smith } 19179566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 191871f1c65dSBarry Smith } else { 191971f1c65dSBarry Smith for (i = 0; i < m; i++) { 192071f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 192171f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 192271f1c65dSBarry Smith } 19239566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 192471f1c65dSBarry Smith } 192571f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 19273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 192871f1c65dSBarry Smith } 192971f1c65dSBarry Smith 1930c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 1931d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1932d71ae5a4SJacob Faibussowitsch { 1933416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1934e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19352e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 193654f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19373d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 193897f1f81fSBarry Smith const PetscInt *idx, *diag; 193917ab2063SBarry Smith 19403a40ed3dSBarry Smith PetscFunctionBegin; 1941b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19429566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 19433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1944b215bc84SStefano Zampini } 1945b965ef7fSBarry Smith its = its * lits; 194691723122SBarry Smith 
194771f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19489566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 194971f1c65dSBarry Smith a->fshift = fshift; 195071f1c65dSBarry Smith a->omega = omega; 1951ed480e8bSBarry Smith 195271f1c65dSBarry Smith diag = a->diag; 195371f1c65dSBarry Smith t = a->ssor_work; 1954ed480e8bSBarry Smith idiag = a->idiag; 195571f1c65dSBarry Smith mdiag = a->mdiag; 1956ed480e8bSBarry Smith 19579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19589566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19599566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1960ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 196117ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 196217ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1963ed480e8bSBarry Smith bs = b; 196417ab2063SBarry Smith for (i = 0; i < m; i++) { 196571f1c65dSBarry Smith d = fshift + mdiag[i]; 1966416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1967ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19682e5835c6SStefano Zampini v = aa + diag[i] + 1; 196917ab2063SBarry Smith sum = b[i] * d / omega; 1970003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 197117ab2063SBarry Smith x[i] = sum; 197217ab2063SBarry Smith } 19739566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19749566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19769566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 197817ab2063SBarry Smith } 1979c783ea89SBarry Smith 198008401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, 
"SOR_APPLY_LOWER is not implemented"); 1981f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19824c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1983887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 198417ab2063SBarry Smith 198517ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 198617ab2063SBarry Smith 1987887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 198817ab2063SBarry Smith */ 198917ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 199017ab2063SBarry Smith 199117ab2063SBarry Smith /* x = (E + U)^{-1} b */ 199217ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1993416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1994ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19952e5835c6SStefano Zampini v = aa + diag[i] + 1; 199617ab2063SBarry Smith sum = b[i]; 1997e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1998ed480e8bSBarry Smith x[i] = sum * idiag[i]; 199917ab2063SBarry Smith } 200017ab2063SBarry Smith 200117ab2063SBarry Smith /* t = b - (2*E - D)x */ 20022e5835c6SStefano Zampini v = aa; 20032205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 200417ab2063SBarry Smith 200517ab2063SBarry Smith /* t = (E + L)^{-1}t */ 2006ed480e8bSBarry Smith ts = t; 2007416022c9SBarry Smith diag = a->diag; 200817ab2063SBarry Smith for (i = 0; i < m; i++) { 2009416022c9SBarry Smith n = diag[i] - a->i[i]; 2010ed480e8bSBarry Smith idx = a->j + a->i[i]; 20112e5835c6SStefano Zampini v = aa + a->i[i]; 201217ab2063SBarry Smith sum = t[i]; 2013003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 2014ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2015733d66baSBarry Smith /* x = x + t */ 2016733d66baSBarry Smith x[i] += t[i]; 201717ab2063SBarry Smith } 201817ab2063SBarry Smith 20199566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20209566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20219566063dSJacob 
Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 202317ab2063SBarry Smith } 202417ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 202517ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 202617ab2063SBarry Smith for (i = 0; i < m; i++) { 2027416022c9SBarry Smith n = diag[i] - a->i[i]; 2028ed480e8bSBarry Smith idx = a->j + a->i[i]; 20292e5835c6SStefano Zampini v = aa + a->i[i]; 203017ab2063SBarry Smith sum = b[i]; 2031e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20325c99c7daSBarry Smith t[i] = sum; 2033ed480e8bSBarry Smith x[i] = sum * idiag[i]; 203417ab2063SBarry Smith } 20355c99c7daSBarry Smith xb = t; 20369566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20373a40ed3dSBarry Smith } else xb = b; 203817ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 203917ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2040416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2041ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20422e5835c6SStefano Zampini v = aa + diag[i] + 1; 204317ab2063SBarry Smith sum = xb[i]; 2044e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20455c99c7daSBarry Smith if (xb == b) { 2046ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20475c99c7daSBarry Smith } else { 2048b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 204917ab2063SBarry Smith } 20505c99c7daSBarry Smith } 20519566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 205217ab2063SBarry Smith } 205317ab2063SBarry Smith its--; 205417ab2063SBarry Smith } 205517ab2063SBarry Smith while (its--) { 205617ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 205717ab2063SBarry Smith for (i = 0; i < m; i++) { 2058b19a5dc2SMark Adams /* lower */ 2059b19a5dc2SMark Adams n = diag[i] - a->i[i]; 
2060ed480e8bSBarry Smith idx = a->j + a->i[i]; 20612e5835c6SStefano Zampini v = aa + a->i[i]; 206217ab2063SBarry Smith sum = b[i]; 2063e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2064b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2065b19a5dc2SMark Adams /* upper */ 2066b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2067b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20682e5835c6SStefano Zampini v = aa + diag[i] + 1; 2069b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2070b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 207117ab2063SBarry Smith } 2072b19a5dc2SMark Adams xb = t; 20739566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2074b19a5dc2SMark Adams } else xb = b; 207517ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 207617ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2077b19a5dc2SMark Adams sum = xb[i]; 2078b19a5dc2SMark Adams if (xb == b) { 2079b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2080416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2081ed480e8bSBarry Smith idx = a->j + a->i[i]; 20822e5835c6SStefano Zampini v = aa + a->i[i]; 2083e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2084ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2085b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2086b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2087b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20882e5835c6SStefano Zampini v = aa + diag[i] + 1; 2089b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2090b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 209117ab2063SBarry Smith } 2092b19a5dc2SMark Adams } 2093b19a5dc2SMark Adams if (xb == b) { 20949566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2095b19a5dc2SMark Adams } else { 20969566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2097b19a5dc2SMark Adams } 209817ab2063SBarry Smith } 209917ab2063SBarry Smith } 21009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 21019566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 21029566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 21033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 210417ab2063SBarry Smith } 210517ab2063SBarry Smith 2106d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2107d71ae5a4SJacob Faibussowitsch { 2108416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21094e220ebcSLois Curfman McInnes 21103a40ed3dSBarry Smith PetscFunctionBegin; 21114e220ebcSLois Curfman McInnes info->block_size = 1.0; 21123966268fSBarry Smith info->nz_allocated = a->maxnz; 21133966268fSBarry Smith info->nz_used = a->nz; 21143966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21153966268fSBarry Smith info->assemblies = A->num_ass; 21163966268fSBarry Smith info->mallocs = A->info.mallocs; 21174dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2118d5f3da31SBarry Smith if (A->factortype) { 21194e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21204e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21214e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21224e220ebcSLois Curfman McInnes } else { 21234e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21244e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21254e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 
21264e220ebcSLois Curfman McInnes } 21273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 212817ab2063SBarry Smith } 212917ab2063SBarry Smith 2130d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2131d71ae5a4SJacob Faibussowitsch { 2132416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2133c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 213497b48c8fSBarry Smith const PetscScalar *xx; 21352e5835c6SStefano Zampini PetscScalar *bb, *aa; 2136c7da8527SEric Chamberland PetscInt d = 0; 213717ab2063SBarry Smith 21383a40ed3dSBarry Smith PetscFunctionBegin; 213997b48c8fSBarry Smith if (x && b) { 21409566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21419566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 214297b48c8fSBarry Smith for (i = 0; i < N; i++) { 2143aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2144447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 214597b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 214697b48c8fSBarry Smith } 21479566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21489566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 214997b48c8fSBarry Smith } 215097b48c8fSBarry Smith 21519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2152a9817697SBarry Smith if (a->keepnonzeropattern) { 2153f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2154aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21559566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2156f1e2ffcdSBarry Smith } 2157f4df32b1SMatthew Knepley if (diag != 0.0) { 2158c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2159c7da8527SEric 
Chamberland d = rows[i]; 2160447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 216108401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2162c7da8527SEric Chamberland } 2163f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2164447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21652e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2166f1e2ffcdSBarry Smith } 2167f1e2ffcdSBarry Smith } 2168f1e2ffcdSBarry Smith } else { 2169f4df32b1SMatthew Knepley if (diag != 0.0) { 217017ab2063SBarry Smith for (i = 0; i < N; i++) { 2171aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21727ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2173447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2174447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2175447d62f5SStefano Zampini } else { 2176416022c9SBarry Smith a->ilen[rows[i]] = 1; 21772e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2178bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2179447d62f5SStefano Zampini } 2180447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21819566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 218217ab2063SBarry Smith } 218317ab2063SBarry Smith } 21843a40ed3dSBarry Smith } else { 218517ab2063SBarry Smith for (i = 0; i < N; i++) { 2186aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2187416022c9SBarry Smith a->ilen[rows[i]] = 0; 218817ab2063SBarry Smith } 218917ab2063SBarry Smith } 2190e56f5c9eSBarry Smith A->nonzerostate++; 2191f1e2ffcdSBarry Smith } 21929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2193dbbe0bcdSBarry Smith 
PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 219517ab2063SBarry Smith } 219617ab2063SBarry Smith 2197d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2198d71ae5a4SJacob Faibussowitsch { 21996e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22006e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 22012b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 22026e169961SBarry Smith const PetscScalar *xx; 22032e5835c6SStefano Zampini PetscScalar *bb, *aa; 22046e169961SBarry Smith 22056e169961SBarry Smith PetscFunctionBegin; 22063ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 22079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 22086e169961SBarry Smith if (x && b) { 22099566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 22109566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 22112b40b63fSBarry Smith vecs = PETSC_TRUE; 22126e169961SBarry Smith } 22139566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 22146e169961SBarry Smith for (i = 0; i < N; i++) { 2215aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 22169566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 22172205254eSKarl Rupp 22186e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22196e169961SBarry Smith } 22206e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22216e169961SBarry Smith if (!zeroed[i]) { 22226e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22234cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22242e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22252e5835c6SStefano Zampini aa[j] = 0.0; 22266e169961SBarry 
Smith } 22276e169961SBarry Smith } 22284cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i]; 22296e169961SBarry Smith } 22306e169961SBarry Smith if (x && b) { 22319566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22329566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22336e169961SBarry Smith } 22349566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22356e169961SBarry Smith if (diag != 0.0) { 22369566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22371d5a398dSstefano_zampini if (missing) { 22381d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22394cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2240aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22419566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22421d5a398dSstefano_zampini } 22431d5a398dSstefano_zampini } else { 2244ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22456e169961SBarry Smith } 22461d5a398dSstefano_zampini } 22479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2248dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22506e169961SBarry Smith } 22516e169961SBarry Smith 2252d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2253d71ae5a4SJacob Faibussowitsch { 2254fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2255fff043a9SJunchao Zhang const PetscScalar *aa; 2256fff043a9SJunchao Zhang PetscInt *itmp; 225717ab2063SBarry Smith 22583a40ed3dSBarry Smith PetscFunctionBegin; 22599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
2260416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22612e5835c6SStefano Zampini if (v) *v = (PetscScalar *)(aa + a->i[row]); 226217ab2063SBarry Smith if (idx) { 2263bfeeae90SHong Zhang itmp = a->j + a->i[row]; 226426fbe8dcSKarl Rupp if (*nz) *idx = itmp; 2265f4259b30SLisandro Dalcin else *idx = NULL; 226617ab2063SBarry Smith } 22679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 226917ab2063SBarry Smith } 227017ab2063SBarry Smith 2271d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2272d71ae5a4SJacob Faibussowitsch { 22733a40ed3dSBarry Smith PetscFunctionBegin; 2274cb4a9cd9SHong Zhang if (nz) *nz = 0; 22752e5835c6SStefano Zampini if (idx) *idx = NULL; 22762e5835c6SStefano Zampini if (v) *v = NULL; 22773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 227817ab2063SBarry Smith } 227917ab2063SBarry Smith 2280d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2281d71ae5a4SJacob Faibussowitsch { 2282416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22832e5835c6SStefano Zampini const MatScalar *v; 228436db0b34SBarry Smith PetscReal sum = 0.0; 228597f1f81fSBarry Smith PetscInt i, j; 228617ab2063SBarry Smith 22873a40ed3dSBarry Smith PetscFunctionBegin; 22889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 228917ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2290570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2291570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2292792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2293570b7f6dSBarry Smith #else 2294416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22959371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22969371c9d4SSatish Balay v++; 229717ab2063SBarry Smith } 22988f1a2a5eSBarry Smith 
*nrm = PetscSqrtReal(sum); 2299570b7f6dSBarry Smith #endif 23009566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 23013a40ed3dSBarry Smith } else if (type == NORM_1) { 230236db0b34SBarry Smith PetscReal *tmp; 230397f1f81fSBarry Smith PetscInt *jj = a->j; 23049566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2305064f8208SBarry Smith *nrm = 0.0; 2306416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 23079371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 23089371c9d4SSatish Balay v++; 230917ab2063SBarry Smith } 2310d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2311064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 231217ab2063SBarry Smith } 23139566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23149566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 23153a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2316064f8208SBarry Smith *nrm = 0.0; 2317d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 23182e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 231917ab2063SBarry Smith sum = 0.0; 2320416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23219371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23229371c9d4SSatish Balay v2++; 232317ab2063SBarry Smith } 2324064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 232517ab2063SBarry Smith } 23269566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2327f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 233017ab2063SBarry Smith } 233117ab2063SBarry Smith 2332d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2333d71ae5a4SJacob Faibussowitsch { 23343d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ 
*)B->data; 233554f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 23362e5835c6SStefano Zampini const MatScalar *va, *vb; 233797f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2338cd0d46ebSvictorle 2339cd0d46ebSvictorle PetscFunctionBegin; 23409566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23419566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23425485867bSBarry Smith if (ma != nb || na != mb) { 23435485867bSBarry Smith *f = PETSC_FALSE; 23443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23455485867bSBarry Smith } 23469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23489371c9d4SSatish Balay aii = aij->i; 23499371c9d4SSatish Balay bii = bij->i; 23509371c9d4SSatish Balay adx = aij->j; 23519371c9d4SSatish Balay bdx = bij->j; 23529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2354cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2355cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2356cd0d46ebSvictorle 2357cd0d46ebSvictorle *f = PETSC_TRUE; 2358cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2359cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 236097f1f81fSBarry Smith PetscInt idc, idr; 23615485867bSBarry Smith PetscScalar vc, vr; 2362cd0d46ebSvictorle /* column/row index/value */ 23635485867bSBarry Smith idc = adx[aptr[i]]; 23645485867bSBarry Smith idr = bdx[bptr[idc]]; 23655485867bSBarry Smith vc = va[aptr[i]]; 23665485867bSBarry Smith vr = vb[bptr[idc]]; 23675485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23685485867bSBarry Smith *f = PETSC_FALSE; 23695485867bSBarry Smith goto done; 2370cd0d46ebSvictorle } else { 23715485867bSBarry Smith aptr[i]++; 23725485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2373cd0d46ebSvictorle } 2374cd0d46ebSvictorle } 2375cd0d46ebSvictorle 
} 2376cd0d46ebSvictorle done: 23779566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23789566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 23813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2382cd0d46ebSvictorle } 2383cd0d46ebSvictorle 2384d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2385d71ae5a4SJacob Faibussowitsch { 23863d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 238754f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 238854f21887SBarry Smith MatScalar *va, *vb; 23891cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23901cbb95d3SBarry Smith 23911cbb95d3SBarry Smith PetscFunctionBegin; 23929566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23939566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23941cbb95d3SBarry Smith if (ma != nb || na != mb) { 23951cbb95d3SBarry Smith *f = PETSC_FALSE; 23963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23971cbb95d3SBarry Smith } 23989371c9d4SSatish Balay aii = aij->i; 23999371c9d4SSatish Balay bii = bij->i; 24009371c9d4SSatish Balay adx = aij->j; 24019371c9d4SSatish Balay bdx = bij->j; 24029371c9d4SSatish Balay va = aij->a; 24039371c9d4SSatish Balay vb = bij->a; 24049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 24059566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 24061cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 24071cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 24081cbb95d3SBarry Smith 24091cbb95d3SBarry Smith *f = PETSC_TRUE; 24101cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 24111cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 24121cbb95d3SBarry Smith PetscInt idc, idr; 
24131cbb95d3SBarry Smith PetscScalar vc, vr; 24141cbb95d3SBarry Smith /* column/row index/value */ 24151cbb95d3SBarry Smith idc = adx[aptr[i]]; 24161cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24171cbb95d3SBarry Smith vc = va[aptr[i]]; 24181cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24191cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24201cbb95d3SBarry Smith *f = PETSC_FALSE; 24211cbb95d3SBarry Smith goto done; 24221cbb95d3SBarry Smith } else { 24231cbb95d3SBarry Smith aptr[i]++; 24241cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24251cbb95d3SBarry Smith } 24261cbb95d3SBarry Smith } 24271cbb95d3SBarry Smith } 24281cbb95d3SBarry Smith done: 24299566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24309566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24321cbb95d3SBarry Smith } 24331cbb95d3SBarry Smith 2434d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2435d71ae5a4SJacob Faibussowitsch { 24369e29f15eSvictorle PetscFunctionBegin; 24379566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f)); 24383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24399e29f15eSvictorle } 24409e29f15eSvictorle 2441d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2442d71ae5a4SJacob Faibussowitsch { 24431cbb95d3SBarry Smith PetscFunctionBegin; 24449566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f)); 24453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24461cbb95d3SBarry Smith } 24471cbb95d3SBarry Smith 2448d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2449d71ae5a4SJacob Faibussowitsch { 2450416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2451fff8e43fSBarry Smith const PetscScalar *l, *r; 2452fff8e43fSBarry Smith PetscScalar x; 
245354f21887SBarry Smith MatScalar *v; 2454fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2455fff8e43fSBarry Smith const PetscInt *jj; 245617ab2063SBarry Smith 24573a40ed3dSBarry Smith PetscFunctionBegin; 245817ab2063SBarry Smith if (ll) { 24593ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24603ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24619566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 246208401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24639566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 246517ab2063SBarry Smith for (i = 0; i < m; i++) { 246617ab2063SBarry Smith x = l[i]; 2467416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24682205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 246917ab2063SBarry Smith } 24709566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24719566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 247317ab2063SBarry Smith } 247417ab2063SBarry Smith if (rr) { 24759566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 247608401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24779566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24792e5835c6SStefano Zampini jj = a->j; 24802205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24829566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24839566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 248417ab2063SBarry Smith } 24859566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 248717ab2063SBarry Smith } 248817ab2063SBarry Smith 2489d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2490d71ae5a4SJacob Faibussowitsch { 2491db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2492d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 249397f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24945d0c19d7SBarry Smith const PetscInt *irow, *icol; 24952e5835c6SStefano Zampini const PetscScalar *aa; 24965d0c19d7SBarry Smith PetscInt nrows, ncols; 249797f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 2498fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2499416022c9SBarry Smith Mat C; 2500cdc6f3adSToby Isaac PetscBool stride; 250117ab2063SBarry Smith 25023a40ed3dSBarry Smith PetscFunctionBegin; 25039566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 25049566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 25059566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 250617ab2063SBarry Smith 25079566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2508ff718158SBarry Smith if (stride) { 25099566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2510ff718158SBarry Smith } else { 2511ff718158SBarry Smith first = 0; 2512ff718158SBarry Smith step = 0; 2513ff718158SBarry Smith } 2514fee21e36SBarry Smith if (stride && step == 1) { 251502834360SBarry Smith /* special case of contiguous rows */ 25169566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 251702834360SBarry Smith /* loop over new rows determining lens and starting points */ 251802834360SBarry Smith 
for (i = 0; i < nrows; i++) { 2519bfeeae90SHong Zhang kstart = ai[irow[i]]; 2520a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2521a91a9bebSLisandro Dalcin starts[i] = kstart; 252202834360SBarry Smith for (k = kstart; k < kend; k++) { 2523bfeeae90SHong Zhang if (aj[k] >= first) { 252402834360SBarry Smith starts[i] = k; 252502834360SBarry Smith break; 252602834360SBarry Smith } 252702834360SBarry Smith } 2528a2744918SBarry Smith sum = 0; 252902834360SBarry Smith while (k < kend) { 2530bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2531a2744918SBarry Smith sum++; 253202834360SBarry Smith } 2533a2744918SBarry Smith lens[i] = sum; 253402834360SBarry Smith } 253502834360SBarry Smith /* create submatrix */ 2536cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 253797f1f81fSBarry Smith PetscInt n_cols, n_rows; 25389566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2539aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25409566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 254108480c60SBarry Smith C = *B; 25423a40ed3dSBarry Smith } else { 25433bef6203SJed Brown PetscInt rbs, cbs; 25449566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25459566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25469566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25479566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25489566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25499566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 255108480c60SBarry Smith } 2552db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2553db02288aSLois Curfman McInnes 255402834360SBarry Smith /* loop over rows 
inserting into submatrix */ 2555fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2556db02288aSLois Curfman McInnes j_new = c->j; 2557db02288aSLois Curfman McInnes i_new = c->i; 25589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 255902834360SBarry Smith for (i = 0; i < nrows; i++) { 2560a2744918SBarry Smith ii = starts[i]; 2561a2744918SBarry Smith lensi = lens[i]; 2562ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25639566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2564a2744918SBarry Smith a_new += lensi; 2565a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2566a2744918SBarry Smith c->ilen[i] = lensi; 256702834360SBarry Smith } 2568fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25709566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25713a40ed3dSBarry Smith } else { 25729566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25739566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25749566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25754dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25766bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25774dcab191SBarry Smith smap[icol[i]] = i + 1; 25784dcab191SBarry Smith } 25794dcab191SBarry Smith 258002834360SBarry Smith /* determine lens of each row */ 258102834360SBarry Smith for (i = 0; i < nrows; i++) { 2582bfeeae90SHong Zhang kstart = ai[irow[i]]; 258302834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 258402834360SBarry Smith lens[i] = 0; 
258502834360SBarry Smith for (k = kstart; k < kend; k++) { 2586ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 258702834360SBarry Smith } 258802834360SBarry Smith } 258917ab2063SBarry Smith /* Create and fill new matrix */ 2590a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2591ace3abfcSBarry Smith PetscBool equal; 25920f5bd95cSBarry Smith 259399141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2594aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25959566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 259628b400f6SJacob Faibussowitsch PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong no of nonzeros"); 25979566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 259808480c60SBarry Smith C = *B; 25993a40ed3dSBarry Smith } else { 26003bef6203SJed Brown PetscInt rbs, cbs; 26019566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 26029566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 26039566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 26049566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 26059566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 26069566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 26079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 260808480c60SBarry Smith } 26099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2610fb3c7e2dSJunchao Zhang 261199141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 2612fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 261317ab2063SBarry Smith for (i = 0; i < nrows; i++) { 261499141d43SSatish Balay 
row = irow[i]; 2615bfeeae90SHong Zhang kstart = ai[row]; 261699141d43SSatish Balay kend = kstart + a->ilen[row]; 2617bfeeae90SHong Zhang mat_i = c->i[i]; 261899141d43SSatish Balay mat_j = c->j + mat_i; 2619fb3c7e2dSJunchao Zhang mat_a = c_a + mat_i; 262099141d43SSatish Balay mat_ilen = c->ilen + i; 262117ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2622bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2623ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26242e5835c6SStefano Zampini *mat_a++ = aa[k]; 262599141d43SSatish Balay (*mat_ilen)++; 262617ab2063SBarry Smith } 262717ab2063SBarry Smith } 262817ab2063SBarry Smith } 26299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 263002834360SBarry Smith /* Free work space */ 26319566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26329566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26339566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2634cdc6f3adSToby Isaac /* sort */ 2635cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2636cdc6f3adSToby Isaac PetscInt ilen; 2637cdc6f3adSToby Isaac 2638cdc6f3adSToby Isaac mat_i = c->i[i]; 2639cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2640fb3c7e2dSJunchao Zhang mat_a = c_a + mat_i; 2641cdc6f3adSToby Isaac ilen = c->ilen[i]; 26429566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2643cdc6f3adSToby Isaac } 2644fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 264502834360SBarry Smith } 26468c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26479566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2648305c6ccfSStefano Zampini #endif 26499566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26509566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 265117ab2063SBarry Smith 26529566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2653416022c9SBarry Smith *B = C; 
26543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 265517ab2063SBarry Smith } 265617ab2063SBarry Smith 2657d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2658d71ae5a4SJacob Faibussowitsch { 265982d44351SHong Zhang Mat B; 266082d44351SHong Zhang 266182d44351SHong Zhang PetscFunctionBegin; 2662c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26639566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26649566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26659566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26669566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26679566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 266882d44351SHong Zhang *subMat = B; 2669c2d650bdSHong Zhang } else { 26709566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2671c2d650bdSHong Zhang } 26723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 267382d44351SHong Zhang } 267482d44351SHong Zhang 2675d71ae5a4SJacob Faibussowitsch PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2676d71ae5a4SJacob Faibussowitsch { 267763b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 267863b91edcSBarry Smith Mat outA; 2679ace3abfcSBarry Smith PetscBool row_identity, col_identity; 268063b91edcSBarry Smith 26813a40ed3dSBarry Smith PetscFunctionBegin; 268208401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26831df811f5SHong Zhang 26849566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26859566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2686a871dcd8SBarry Smith 268763b91edcSBarry Smith outA = inA; 2688d5f3da31SBarry 
Smith outA->factortype = MAT_FACTOR_LU; 26899566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26909566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26912205254eSKarl Rupp 26929566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26939566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26942205254eSKarl Rupp 2695c3122656SLisandro Dalcin a->row = row; 26962205254eSKarl Rupp 26979566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26989566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26992205254eSKarl Rupp 2700c3122656SLisandro Dalcin a->col = col; 270163b91edcSBarry Smith 270236db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 27039566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 27049566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2705f0ec6fceSSatish Balay 270694a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 27079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 270894a9d846SBarry Smith } 270963b91edcSBarry Smith 27109566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2711137fb511SHong Zhang if (row_identity && col_identity) { 27129566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2713137fb511SHong Zhang } else { 27149566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2715137fb511SHong Zhang } 27163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2717a871dcd8SBarry Smith } 2718a871dcd8SBarry Smith 2719d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2720d71ae5a4SJacob Faibussowitsch { 2721f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2722dfa0f9e5SStefano Zampini 
PetscScalar *v; 2723c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 27243a40ed3dSBarry Smith 27253a40ed3dSBarry Smith PetscFunctionBegin; 27269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27279566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2728792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27299566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2733f0b747eeSBarry Smith } 2734f0b747eeSBarry Smith 2735d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2736d71ae5a4SJacob Faibussowitsch { 273716b64355SHong Zhang PetscInt i; 273816b64355SHong Zhang 273916b64355SHong Zhang PetscFunctionBegin; 274016b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27419566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 274216b64355SHong Zhang 274348a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27449566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 274516b64355SHong Zhang 274616b64355SHong Zhang if (submatj->rbuf1) { 27479566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27489566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 274916b64355SHong Zhang } 275016b64355SHong Zhang 275148a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27529566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27539566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 275416b64355SHong Zhang } 
275516b64355SHong Zhang 275616b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2757eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27589566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27599566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 276016b64355SHong Zhang #else 27619566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 276216b64355SHong Zhang #endif 276316b64355SHong Zhang 276416b64355SHong Zhang if (!submatj->allcolumns) { 276516b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2766eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap)); 276716b64355SHong Zhang #else 27689566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 276916b64355SHong Zhang #endif 277016b64355SHong Zhang } 27719566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 277216b64355SHong Zhang 27739566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 27743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 277516b64355SHong Zhang } 277616b64355SHong Zhang 2777d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2778d71ae5a4SJacob Faibussowitsch { 277916b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27805c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 278116b64355SHong Zhang 278216b64355SHong Zhang PetscFunctionBegin; 27839566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27849566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 278616b64355SHong Zhang } 278716b64355SHong Zhang 278889a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2789d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2790d71ae5a4SJacob Faibussowitsch { 27912d033e1fSHong Zhang PetscInt i; 
27920fb991dcSHong Zhang Mat C; 27930fb991dcSHong Zhang Mat_SeqAIJ *c; 27940fb991dcSHong Zhang Mat_SubSppt *submatj; 27952d033e1fSHong Zhang 27962d033e1fSHong Zhang PetscFunctionBegin; 27972d033e1fSHong Zhang for (i = 0; i < n; i++) { 27980fb991dcSHong Zhang C = (*mat)[i]; 27990fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 28000fb991dcSHong Zhang submatj = c->submatis1; 28012d033e1fSHong Zhang if (submatj) { 2802682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 280326cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 28049566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 28059566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 28069566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 28073faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 28089566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 28099566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 28109566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2811682e4c99SStefano Zampini } 28122d033e1fSHong Zhang } else { 28139566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 28142d033e1fSHong Zhang } 28152d033e1fSHong Zhang } 281686e85357SHong Zhang 281763a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 28189566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 281963a75b2aSHong Zhang 28209566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28222d033e1fSHong Zhang } 28232d033e1fSHong Zhang 2824d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2825d71ae5a4SJacob Faibussowitsch { 282697f1f81fSBarry Smith PetscInt i; 2827cddf8d76SBarry Smith 28283a40ed3dSBarry Smith PetscFunctionBegin; 282948a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) 
PetscCall(PetscCalloc1(n + 1, B)); 2830cddf8d76SBarry Smith 283148a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2833cddf8d76SBarry Smith } 2834cddf8d76SBarry Smith 2835d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2836d71ae5a4SJacob Faibussowitsch { 2837e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28389a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, isz, val; 28395d0c19d7SBarry Smith const PetscInt *idx; 28409a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1; 2841f1af5d2fSBarry Smith PetscBT table; 2842bbd702dbSSatish Balay 28433a40ed3dSBarry Smith PetscFunctionBegin; 28449a88ca10SBarry Smith m = A->rmap->n / bs; 2845e4d965acSSatish Balay ai = a->i; 2846bfeeae90SHong Zhang aj = a->j; 28478a047759SSatish Balay 284808401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 284906763907SSatish Balay 28509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28519566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 285206763907SSatish Balay 2853e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2854b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2855e4d965acSSatish Balay isz = 0; 28569566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2857e4d965acSSatish Balay 2858e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28599566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28609566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2861e4d965acSSatish Balay 28629a88ca10SBarry Smith if (bs > 1) { 28639a88ca10SBarry Smith /* Enter these into the temp 
arrays. I.e., mark table[row], enter row into new index */ 28649a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28659a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28669a88ca10SBarry Smith } 28679a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28689a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28699a88ca10SBarry Smith 28709a88ca10SBarry Smith k = 0; 28719a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28729a88ca10SBarry Smith n = isz; 28739a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28749a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28759a88ca10SBarry Smith row = bs * nidx[k] + ll; 28769a88ca10SBarry Smith start = ai[row]; 28779a88ca10SBarry Smith end = ai[row + 1]; 28789a88ca10SBarry Smith for (l = start; l < end; l++) { 28799a88ca10SBarry Smith val = aj[l] / bs; 28809a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28819a88ca10SBarry Smith } 28829a88ca10SBarry Smith } 28839a88ca10SBarry Smith } 28849a88ca10SBarry Smith } 28859a88ca10SBarry Smith PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i))); 28869a88ca10SBarry Smith } else { 2887dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2888e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28892205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28904dcbc457SBarry Smith } 28919566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28929566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2893e4d965acSSatish Balay 289404a348a9SBarry Smith k = 0; 289504a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 289604a348a9SBarry Smith n = isz; 289706763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2898e4d965acSSatish Balay row = nidx[k]; 2899e4d965acSSatish Balay start = ai[row]; 2900e4d965acSSatish Balay end = ai[row + 1]; 290104a348a9SBarry Smith for (l = start; l < end; l++) { 2902efb16452SHong Zhang val = aj[l]; 29032205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2904e4d965acSSatish Balay } 2905e4d965acSSatish Balay } 2906e4d965acSSatish Balay } 29079566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2908e4d965acSSatish Balay } 29099a88ca10SBarry Smith } 29109566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 29119566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 29123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29134dcbc457SBarry Smith } 291417ab2063SBarry Smith 2915d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2916d71ae5a4SJacob Faibussowitsch { 29170513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29183b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 29195d0c19d7SBarry Smith const PetscInt *row, *col; 29205d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 292156cd22aeSBarry Smith IS icolp, irowp; 29220298fd71SBarry Smith PetscInt *cwork = NULL; 29230298fd71SBarry Smith PetscScalar *vwork = NULL; 29240513a670SBarry Smith 
29253a40ed3dSBarry Smith PetscFunctionBegin; 29269566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29279566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29289566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29299566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29300513a670SBarry Smith 29310513a670SBarry Smith /* determine lengths of permuted rows */ 29329566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29332205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29349566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29359566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29369566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29379566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29399566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29400513a670SBarry Smith 29419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29420513a670SBarry Smith for (i = 0; i < m; i++) { 29439566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29442205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29459566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29469566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29470513a670SBarry Smith } 29489566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29492205254eSKarl Rupp 29503c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29512205254eSKarl Rupp 29528c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29539566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29549fe5e383SStefano Zampini #endif 
29559566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29569566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29579566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29589566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29599566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29609566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 296148a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29630513a670SBarry Smith } 29640513a670SBarry Smith 2965d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2966d71ae5a4SJacob Faibussowitsch { 2967cb5b572fSBarry Smith PetscFunctionBegin; 296833f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 296933f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2970be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2971be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29722e5835c6SStefano Zampini const PetscScalar *aa; 2973be6bf707SBarry Smith 29749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 297508401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29769566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29779566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2979cb5b572fSBarry Smith } else { 29809566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2981cb5b572fSBarry Smith } 29823ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 2983cb5b572fSBarry Smith } 2984cb5b572fSBarry Smith 2985d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2986d71ae5a4SJacob Faibussowitsch { 29876c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29886e111a19SKarl Rupp 29896c0721eeSBarry Smith PetscFunctionBegin; 29906c0721eeSBarry Smith *array = a->a; 29913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29926c0721eeSBarry Smith } 29936c0721eeSBarry Smith 2994d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[]) 2995d71ae5a4SJacob Faibussowitsch { 29966c0721eeSBarry Smith PetscFunctionBegin; 2997f38c1e66SStefano Zampini *array = NULL; 29983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29996c0721eeSBarry Smith } 3000273d9f13SBarry Smith 30018229c054SShri Abhyankar /* 30028229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 30038229c054SShri Abhyankar have different nonzero structure. 
30048229c054SShri Abhyankar */ 3005d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 3006d71ae5a4SJacob Faibussowitsch { 3007b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 3008ec7775f6SShri Abhyankar 3009ec7775f6SShri Abhyankar PetscFunctionBegin; 3010ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 3011ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 3012b264fe52SHong Zhang const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i]; 3013b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 3014b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 30158af7cee1SJed Brown nnz[i] = 0; 30168af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 3017b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3018b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 30198af7cee1SJed Brown nnz[i]++; 30208af7cee1SJed Brown } 30218af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 3022ec7775f6SShri Abhyankar } 30233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3024ec7775f6SShri Abhyankar } 3025ec7775f6SShri Abhyankar 3026d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3027d71ae5a4SJacob Faibussowitsch { 3028b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3029b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3030b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data; 3031b264fe52SHong Zhang 3032b264fe52SHong Zhang PetscFunctionBegin; 3033b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30349566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 30353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3036b264fe52SHong Zhang } 3037b264fe52SHong Zhang 3038d71ae5a4SJacob Faibussowitsch PetscErrorCode 
MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3039d71ae5a4SJacob Faibussowitsch { 3040ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3041ac90fabeSBarry Smith 3042ac90fabeSBarry Smith PetscFunctionBegin; 3043134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3044134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3045134adf20SPierre Jolivet if (e) { 30469566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 304781fa06acSBarry Smith if (e) { 30489566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3049134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 305081fa06acSBarry Smith } 305181fa06acSBarry Smith } 305254c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 305381fa06acSBarry Smith } 3054ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30552e5835c6SStefano Zampini const PetscScalar *xa; 30562e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 305781fa06acSBarry Smith PetscBLASInt one = 1, bnz; 305881fa06acSBarry Smith 30599566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3062792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 30639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30659566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30679566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 
3068ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30699566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3070ac90fabeSBarry Smith } else { 30718229c054SShri Abhyankar Mat B; 30728229c054SShri Abhyankar PetscInt *nnz; 30739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30749566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30759566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30769566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30779566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30789566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30809566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30819566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30829bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30839566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3084ac90fabeSBarry Smith } 30853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3086ac90fabeSBarry Smith } 3087ac90fabeSBarry Smith 3088d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3089d71ae5a4SJacob Faibussowitsch { 3090354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3091354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3092354c94deSBarry Smith PetscInt i, nz; 3093354c94deSBarry Smith PetscScalar *a; 3094354c94deSBarry Smith 3095354c94deSBarry Smith PetscFunctionBegin; 3096354c94deSBarry Smith nz = aij->nz; 30979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30982205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 30999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, 
&a)); 3100354c94deSBarry Smith #else 3101354c94deSBarry Smith PetscFunctionBegin; 3102354c94deSBarry Smith #endif 31033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3104354c94deSBarry Smith } 3105354c94deSBarry Smith 3106d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3107d71ae5a4SJacob Faibussowitsch { 3108e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3109d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3110e34fafa9SBarry Smith PetscReal atmp; 3111985db425SBarry Smith PetscScalar *x; 3112ce496241SStefano Zampini const MatScalar *aa, *av; 3113e34fafa9SBarry Smith 3114e34fafa9SBarry Smith PetscFunctionBegin; 311528b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3117ce496241SStefano Zampini aa = av; 3118e34fafa9SBarry Smith ai = a->i; 3119e34fafa9SBarry Smith aj = a->j; 3120e34fafa9SBarry Smith 31219566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31229566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31239566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 312408401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3125e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31269371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31279371c9d4SSatish Balay ai++; 3128e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3129985db425SBarry Smith atmp = PetscAbsScalar(*aa); 31309371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31319371c9d4SSatish Balay x[i] = atmp; 31329371c9d4SSatish Balay if (idx) idx[i] = *aj; 31339371c9d4SSatish Balay } 31349371c9d4SSatish Balay aa++; 31359371c9d4SSatish Balay aj++; 3136985db425SBarry Smith } 3137985db425SBarry Smith } 31389566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, 
&x)); 31399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3141985db425SBarry Smith } 3142985db425SBarry Smith 3143d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3144d71ae5a4SJacob Faibussowitsch { 3145985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3146d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3147985db425SBarry Smith PetscScalar *x; 3148ce496241SStefano Zampini const MatScalar *aa, *av; 3149985db425SBarry Smith 3150985db425SBarry Smith PetscFunctionBegin; 315128b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3153ce496241SStefano Zampini aa = av; 3154985db425SBarry Smith ai = a->i; 3155985db425SBarry Smith aj = a->j; 3156985db425SBarry Smith 31579566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31589566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31599566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 316008401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3161985db425SBarry Smith for (i = 0; i < m; i++) { 31629371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31639371c9d4SSatish Balay ai++; 3164d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31659371c9d4SSatish Balay x[i] = *aa; 31669371c9d4SSatish Balay if (idx) idx[i] = 0; 3167985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3168985db425SBarry Smith x[i] = 0.0; 3169985db425SBarry Smith if (idx) { 3170985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3171985db425SBarry Smith if (aj[j] > j) { 3172985db425SBarry Smith idx[i] = j; 3173985db425SBarry Smith break; 
3174985db425SBarry Smith } 3175985db425SBarry Smith } 31761a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31771a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3178985db425SBarry Smith } 3179985db425SBarry Smith } 3180985db425SBarry Smith for (j = 0; j < ncols; j++) { 31819371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31829371c9d4SSatish Balay x[i] = *aa; 31839371c9d4SSatish Balay if (idx) idx[i] = *aj; 31849371c9d4SSatish Balay } 31859371c9d4SSatish Balay aa++; 31869371c9d4SSatish Balay aj++; 3187985db425SBarry Smith } 3188985db425SBarry Smith } 31899566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3192985db425SBarry Smith } 3193985db425SBarry Smith 3194d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3195d71ae5a4SJacob Faibussowitsch { 3196c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3197c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3198ce496241SStefano Zampini PetscScalar *x; 3199ce496241SStefano Zampini const MatScalar *aa, *av; 3200c87e5d42SMatthew Knepley 3201c87e5d42SMatthew Knepley PetscFunctionBegin; 32029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3203ce496241SStefano Zampini aa = av; 3204c87e5d42SMatthew Knepley ai = a->i; 3205c87e5d42SMatthew Knepley aj = a->j; 3206c87e5d42SMatthew Knepley 32079566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32089566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32099566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 321008401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. 
%" PetscInt_FMT " rows", m, n); 3211c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32129371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32139371c9d4SSatish Balay ai++; 3214f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32159371c9d4SSatish Balay x[i] = *aa; 32169371c9d4SSatish Balay if (idx) idx[i] = 0; 3217f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3218f07e67edSHong Zhang x[i] = 0.0; 3219f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3220289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3221f07e67edSHong Zhang if (aj[j] > j) { 3222f07e67edSHong Zhang idx[i] = j; 32232205254eSKarl Rupp break; 32242205254eSKarl Rupp } 3225289a08f5SMatthew Knepley } 3226f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3227f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3228f07e67edSHong Zhang } 3229289a08f5SMatthew Knepley } 3230c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32319371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32329371c9d4SSatish Balay x[i] = *aa; 32339371c9d4SSatish Balay if (idx) idx[i] = *aj; 32349371c9d4SSatish Balay } 32359371c9d4SSatish Balay aa++; 32369371c9d4SSatish Balay aj++; 3237c87e5d42SMatthew Knepley } 3238c87e5d42SMatthew Knepley } 32399566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3242c87e5d42SMatthew Knepley } 3243c87e5d42SMatthew Knepley 3244d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3245d71ae5a4SJacob Faibussowitsch { 3246985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3247d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3248d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3249985db425SBarry Smith PetscScalar *x; 
3250ce496241SStefano Zampini const MatScalar *aa, *av; 3251985db425SBarry Smith 3252985db425SBarry Smith PetscFunctionBegin; 325328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3255ce496241SStefano Zampini aa = av; 3256985db425SBarry Smith ai = a->i; 3257985db425SBarry Smith aj = a->j; 3258985db425SBarry Smith 32599566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32609566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32619566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 326208401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3263985db425SBarry Smith for (i = 0; i < m; i++) { 32649371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32659371c9d4SSatish Balay ai++; 3266d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32679371c9d4SSatish Balay x[i] = *aa; 32689371c9d4SSatish Balay if (idx) idx[i] = 0; 3269985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3270985db425SBarry Smith x[i] = 0.0; 3271985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3272985db425SBarry Smith for (j = 0; j < ncols; j++) { 3273985db425SBarry Smith if (aj[j] > j) { 3274985db425SBarry Smith idx[i] = j; 3275985db425SBarry Smith break; 3276985db425SBarry Smith } 3277985db425SBarry Smith } 3278fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3279fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3280985db425SBarry Smith } 3281985db425SBarry Smith } 3282985db425SBarry Smith for (j = 0; j < ncols; j++) { 32839371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32849371c9d4SSatish Balay x[i] = *aa; 32859371c9d4SSatish Balay if (idx) idx[i] = *aj; 32869371c9d4SSatish Balay } 32879371c9d4SSatish Balay aa++; 
32889371c9d4SSatish Balay aj++; 3289e34fafa9SBarry Smith } 3290e34fafa9SBarry Smith } 32919566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3294e34fafa9SBarry Smith } 3295bbead8a2SBarry Smith 3296d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3297d71ae5a4SJacob Faibussowitsch { 3298bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 329933d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3300bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 33010da83c2eSBarry Smith const PetscReal shift = 0.0; 33021a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3303bbead8a2SBarry Smith 3304bbead8a2SBarry Smith PetscFunctionBegin; 3305a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33064a0d0026SBarry Smith if (a->ibdiagvalid) { 33074a0d0026SBarry Smith if (values) *values = a->ibdiag; 33083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 33094a0d0026SBarry Smith } 33109566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 33114dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3312bbead8a2SBarry Smith diag = a->ibdiag; 3313bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3314bbead8a2SBarry Smith /* factor and invert each block */ 3315bbead8a2SBarry Smith switch (bs) { 3316bbead8a2SBarry Smith case 1: 3317bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33189566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 3319ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3320ec1892c8SHong Zhang if (allowzeropivot) { 33217b6c816cSBarry Smith A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 33227b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33237b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33249566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 332598921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3326ec1892c8SHong Zhang } 3327bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3328bbead8a2SBarry Smith } 3329bbead8a2SBarry Smith break; 3330bbead8a2SBarry Smith case 2: 3331bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33329371c9d4SSatish Balay ij[0] = 2 * i; 33339371c9d4SSatish Balay ij[1] = 2 * i + 1; 33349566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33359566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33367b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33379566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3338bbead8a2SBarry Smith diag += 4; 3339bbead8a2SBarry Smith } 3340bbead8a2SBarry Smith break; 3341bbead8a2SBarry Smith case 3: 3342bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33439371c9d4SSatish Balay ij[0] = 3 * i; 33449371c9d4SSatish Balay ij[1] = 3 * i + 1; 33459371c9d4SSatish Balay ij[2] = 3 * i + 2; 33469566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 33487b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33499566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3350bbead8a2SBarry Smith diag += 9; 3351bbead8a2SBarry Smith } 3352bbead8a2SBarry Smith break; 3353bbead8a2SBarry Smith case 4: 3354bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33559371c9d4SSatish Balay ij[0] = 4 * i; 33569371c9d4SSatish Balay ij[1] = 4 * i + 1; 33579371c9d4SSatish Balay ij[2] = 4 * i + 2; 33589371c9d4SSatish Balay ij[3] = 4 * i + 3; 33599566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33617b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3363bbead8a2SBarry Smith diag += 16; 3364bbead8a2SBarry Smith } 3365bbead8a2SBarry Smith break; 3366bbead8a2SBarry Smith case 5: 3367bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33689371c9d4SSatish Balay ij[0] = 5 * i; 33699371c9d4SSatish Balay ij[1] = 5 * i + 1; 33709371c9d4SSatish Balay ij[2] = 5 * i + 2; 33719371c9d4SSatish Balay ij[3] = 5 * i + 3; 33729371c9d4SSatish Balay ij[4] = 5 * i + 4; 33739566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33749566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33757b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33769566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3377bbead8a2SBarry Smith diag += 25; 3378bbead8a2SBarry Smith } 3379bbead8a2SBarry Smith break; 3380bbead8a2SBarry Smith case 6: 3381bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33829371c9d4SSatish Balay ij[0] = 6 * i; 33839371c9d4SSatish Balay ij[1] = 6 * i + 1; 33849371c9d4SSatish Balay ij[2] = 6 * i + 2; 33859371c9d4SSatish Balay ij[3] = 6 * i + 3; 33869371c9d4SSatish Balay ij[4] = 
6 * i + 4; 33879371c9d4SSatish Balay ij[5] = 6 * i + 5; 33889566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33899566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33907b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33919566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3392bbead8a2SBarry Smith diag += 36; 3393bbead8a2SBarry Smith } 3394bbead8a2SBarry Smith break; 3395bbead8a2SBarry Smith case 7: 3396bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33979371c9d4SSatish Balay ij[0] = 7 * i; 33989371c9d4SSatish Balay ij[1] = 7 * i + 1; 33999371c9d4SSatish Balay ij[2] = 7 * i + 2; 34009371c9d4SSatish Balay ij[3] = 7 * i + 3; 34019371c9d4SSatish Balay ij[4] = 7 * i + 4; 34029371c9d4SSatish Balay ij[5] = 7 * i + 5; 3403cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 34049566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 34059566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 34067b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34079566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3408bbead8a2SBarry Smith diag += 49; 3409bbead8a2SBarry Smith } 3410bbead8a2SBarry Smith break; 3411bbead8a2SBarry Smith default: 34129566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3413bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3414ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34159566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34169566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 34177b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 34189566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3419bbead8a2SBarry Smith diag += bs2; 3420bbead8a2SBarry Smith } 34219566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3422bbead8a2SBarry Smith } 3423bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 34243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3425bbead8a2SBarry Smith } 3426bbead8a2SBarry Smith 3427d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3428d71ae5a4SJacob Faibussowitsch { 342973a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3430fff043a9SJunchao Zhang PetscScalar a, *aa; 343173a71a0fSBarry Smith PetscInt m, n, i, j, col; 343273a71a0fSBarry Smith 343373a71a0fSBarry Smith PetscFunctionBegin; 343473a71a0fSBarry Smith if (!x->assembled) { 34359566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 343673a71a0fSBarry Smith for (i = 0; i < m; i++) { 343773a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34389566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 343973a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34409566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 344173a71a0fSBarry Smith } 344273a71a0fSBarry Smith } 3443e2ce353bSJunchao Zhang } else { 34449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34459566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3447e2ce353bSJunchao Zhang } 34489566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34499566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 345173a71a0fSBarry Smith } 345273a71a0fSBarry Smith 3453679944adSJunchao 
Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3454d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3455d71ae5a4SJacob Faibussowitsch { 3456679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3457679944adSJunchao Zhang PetscScalar a; 3458679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3459679944adSJunchao Zhang 3460679944adSJunchao Zhang PetscFunctionBegin; 3461679944adSJunchao Zhang nskip = high - low; 34629566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3463679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3464679944adSJunchao Zhang for (i = 0; i < m; i++) { 3465679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34669566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3467679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3468679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34699566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3470679944adSJunchao Zhang } 3471e2ce353bSJunchao Zhang } 34729566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34739566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3475679944adSJunchao Zhang } 3476679944adSJunchao Zhang 34770a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3478cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3479cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3480cb5b572fSBarry Smith MatMult_SeqAIJ, 348197304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34827c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34837c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3484f4259b30SLisandro Dalcin NULL, 3485f4259b30SLisandro Dalcin NULL, 
3486f4259b30SLisandro Dalcin NULL, 3487f4259b30SLisandro Dalcin /* 10*/ NULL, 3488cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3489f4259b30SLisandro Dalcin NULL, 349041f059aeSBarry Smith MatSOR_SeqAIJ, 349191e9d3e2SHong Zhang MatTranspose_SeqAIJ, 349297304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3493cb5b572fSBarry Smith MatEqual_SeqAIJ, 3494cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3495cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3496cb5b572fSBarry Smith MatNorm_SeqAIJ, 3497f4259b30SLisandro Dalcin /* 20*/ NULL, 3498cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3499cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3500cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3501d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3502f4259b30SLisandro Dalcin NULL, 3503f4259b30SLisandro Dalcin NULL, 3504f4259b30SLisandro Dalcin NULL, 3505f4259b30SLisandro Dalcin NULL, 350626cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 3507f4259b30SLisandro Dalcin NULL, 3508f4259b30SLisandro Dalcin NULL, 3509f4259b30SLisandro Dalcin NULL, 3510f4259b30SLisandro Dalcin NULL, 3511d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3512f4259b30SLisandro Dalcin NULL, 3513f4259b30SLisandro Dalcin NULL, 3514cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3515f4259b30SLisandro Dalcin NULL, 3516d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35177dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3518cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3519cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3520cb5b572fSBarry Smith MatCopy_SeqAIJ, 3521d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3522cb5b572fSBarry Smith MatScale_SeqAIJ, 35237d68702bSBarry Smith MatShift_SeqAIJ, 352479299369SBarry Smith MatDiagonalSet_SeqAIJ, 35256e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 352673a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35273b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35283b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35293b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3530a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 
353193dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3532f4259b30SLisandro Dalcin NULL, 3533f4259b30SLisandro Dalcin NULL, 3534cda55fadSBarry Smith MatPermute_SeqAIJ, 3535f4259b30SLisandro Dalcin NULL, 3536f4259b30SLisandro Dalcin /* 59*/ NULL, 3537b9b97703SBarry Smith MatDestroy_SeqAIJ, 3538b9b97703SBarry Smith MatView_SeqAIJ, 3539f4259b30SLisandro Dalcin NULL, 3540f4259b30SLisandro Dalcin NULL, 3541f4259b30SLisandro Dalcin /* 64*/ NULL, 3542321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3543f4259b30SLisandro Dalcin NULL, 3544f4259b30SLisandro Dalcin NULL, 3545f4259b30SLisandro Dalcin NULL, 3546d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3547c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin NULL, 3550f4259b30SLisandro Dalcin NULL, 3551f4259b30SLisandro Dalcin /* 74*/ NULL, 35523acb8795SBarry Smith MatFDColoringApply_AIJ, 3553f4259b30SLisandro Dalcin NULL, 3554f4259b30SLisandro Dalcin NULL, 3555f4259b30SLisandro Dalcin NULL, 35566ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3557f4259b30SLisandro Dalcin NULL, 3558f4259b30SLisandro Dalcin NULL, 3559f4259b30SLisandro Dalcin NULL, 3560bc011b1eSHong Zhang MatLoad_SeqAIJ, 3561d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35621cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3563f4259b30SLisandro Dalcin NULL, 3564f4259b30SLisandro Dalcin NULL, 3565f4259b30SLisandro Dalcin NULL, 3566f4259b30SLisandro Dalcin /* 89*/ NULL, 3567f4259b30SLisandro Dalcin NULL, 356826be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3569f4259b30SLisandro Dalcin NULL, 3570f4259b30SLisandro Dalcin NULL, 35718fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3572f4259b30SLisandro Dalcin NULL, 3573f4259b30SLisandro Dalcin NULL, 35746fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3575f4259b30SLisandro Dalcin NULL, 35764222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3577f4259b30SLisandro 
Dalcin NULL, 3578f4259b30SLisandro Dalcin NULL, 357987d4246cSBarry Smith MatConjugate_SeqAIJ, 3580f4259b30SLisandro Dalcin NULL, 3581d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 358299cafbc1SBarry Smith MatRealPart_SeqAIJ, 3583f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3584f4259b30SLisandro Dalcin NULL, 3585f4259b30SLisandro Dalcin NULL, 3586cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3587f4259b30SLisandro Dalcin NULL, 35882af78befSBarry Smith MatGetRowMin_SeqAIJ, 3589f4259b30SLisandro Dalcin NULL, 3590599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3591f4259b30SLisandro Dalcin /*114*/ NULL, 3592f4259b30SLisandro Dalcin NULL, 3593f4259b30SLisandro Dalcin NULL, 3594f4259b30SLisandro Dalcin NULL, 3595f4259b30SLisandro Dalcin NULL, 3596f4259b30SLisandro Dalcin /*119*/ NULL, 3597f4259b30SLisandro Dalcin NULL, 3598f4259b30SLisandro Dalcin NULL, 3599f4259b30SLisandro Dalcin NULL, 3600b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 36010716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3602a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 360337868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 36040da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3605f4259b30SLisandro Dalcin NULL, 3606f4259b30SLisandro Dalcin /*129*/ NULL, 3607f4259b30SLisandro Dalcin NULL, 3608f4259b30SLisandro Dalcin NULL, 360975648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3610b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3611b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36122b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3613f4259b30SLisandro Dalcin NULL, 3614f4259b30SLisandro Dalcin NULL, 36153964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3616f4259b30SLisandro Dalcin /*139*/ NULL, 3617f4259b30SLisandro Dalcin NULL, 3618f4259b30SLisandro Dalcin NULL, 36193a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36209c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36214222ddf1SHong Zhang 
MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36224222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3623f4259b30SLisandro Dalcin NULL, 362472833a62Smarkadams4 NULL, 362572833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36262d776b49SBarry Smith NULL, 3627dec0b466SHong Zhang /*150*/ MatTransposeSymbolic_SeqAIJ, 3628dec0b466SHong Zhang MatEliminateZeros_SeqAIJ}; 362917ab2063SBarry Smith 3630d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3631d71ae5a4SJacob Faibussowitsch { 3632bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 363397f1f81fSBarry Smith PetscInt i, nz, n; 3634bef8e0ddSBarry Smith 3635bef8e0ddSBarry Smith PetscFunctionBegin; 3636bef8e0ddSBarry Smith nz = aij->maxnz; 3637d0f46423SBarry Smith n = mat->rmap->n; 3638ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3639bef8e0ddSBarry Smith aij->nz = nz; 3640ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 36413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3642bef8e0ddSBarry Smith } 3643bef8e0ddSBarry Smith 3644a3bb6f32SFande Kong /* 3645ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3646ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3647ddea5d60SJunchao Zhang */ 3648d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3649d71ae5a4SJacob Faibussowitsch { 3650a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3651eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3652eec179cfSJacob Faibussowitsch PetscHashIter tpos; 365325b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 365425b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3655a3bb6f32SFande Kong 3656a3bb6f32SFande Kong PetscFunctionBegin; 3657a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3658a3bb6f32SFande Kong PetscValidPointer(mapping, 2); 3659a3bb6f32SFande Kong /* use a table */ 3660eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3661a3bb6f32SFande Kong ec = 0; 366225b670f0SStefano Zampini for (i = 0; i < nz; i++) { 366325b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3664eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3665a3bb6f32SFande Kong if (!data) { 3666a3bb6f32SFande Kong /* one based table */ 3667c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3668a3bb6f32SFande Kong } 3669a3bb6f32SFande Kong } 3670a3bb6f32SFande Kong /* form array of columns we need */ 36719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3672eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3673eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3674eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3675eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3676eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3677a3bb6f32SFande Kong gid--; 3678a3bb6f32SFande 
Kong lid--; 3679a3bb6f32SFande Kong garray[lid] = gid; 3680a3bb6f32SFande Kong } 36819566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3682eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3683c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3684a3bb6f32SFande Kong /* compact out the extra columns in B */ 368525b670f0SStefano Zampini for (i = 0; i < nz; i++) { 368625b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3687eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3688a3bb6f32SFande Kong lid--; 368925b670f0SStefano Zampini jj[i] = lid; 3690a3bb6f32SFande Kong } 36919566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3692eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 36939566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36949566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36959566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 36963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3697a3bb6f32SFande Kong } 3698a3bb6f32SFande Kong 3699bef8e0ddSBarry Smith /*@ 3700bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3701bef8e0ddSBarry Smith in the matrix. 
3702bef8e0ddSBarry Smith 3703bef8e0ddSBarry Smith Input Parameters: 370411a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3705bef8e0ddSBarry Smith - indices - the column indices 3706bef8e0ddSBarry Smith 370715091d37SBarry Smith Level: advanced 370815091d37SBarry Smith 3709bef8e0ddSBarry Smith Notes: 3710bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3711bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 371211a5261eSBarry Smith of the `MatSetValues()` operation. 3713bef8e0ddSBarry Smith 3714bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 371511a5261eSBarry Smith `MatCreateSeqAIJ()`, and the column indices MUST be sorted. 3716bef8e0ddSBarry Smith 371711a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3718bef8e0ddSBarry Smith 3719b9617806SBarry Smith The indices should start with zero, not one. 3720b9617806SBarry Smith 37211cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ` 3722bef8e0ddSBarry Smith @*/ 3723d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3724d71ae5a4SJacob Faibussowitsch { 3725bef8e0ddSBarry Smith PetscFunctionBegin; 37260700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 3727dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 3728cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 37293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3730bef8e0ddSBarry Smith } 3731bef8e0ddSBarry Smith 3732d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3733d71ae5a4SJacob Faibussowitsch { 3734be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3735d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3736be6bf707SBarry Smith 3737be6bf707SBarry Smith PetscFunctionBegin; 373828b400f6SJacob Faibussowitsch 
PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3739be6bf707SBarry Smith 3740be6bf707SBarry Smith /* allocate space for values if not already there */ 37414dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3742be6bf707SBarry Smith 3743be6bf707SBarry Smith /* copy values over */ 37449566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 37453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3746be6bf707SBarry Smith } 3747be6bf707SBarry Smith 3748be6bf707SBarry Smith /*@ 374920f4b53cSBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the 3750be6bf707SBarry Smith nonlinear portion. 3751be6bf707SBarry Smith 3752c3339decSBarry Smith Logically Collective 3753be6bf707SBarry Smith 375427430b45SBarry Smith Input Parameter: 375511a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3756be6bf707SBarry Smith 375715091d37SBarry Smith Level: advanced 375815091d37SBarry Smith 375927430b45SBarry Smith Usage: 376027430b45SBarry Smith .vb 37612ef1f0ffSBarry Smith Using SNES 376227430b45SBarry Smith Create Jacobian matrix 376327430b45SBarry Smith Set linear terms into matrix 376427430b45SBarry Smith Apply boundary conditions to matrix, at this time matrix must have 376527430b45SBarry Smith final nonzero structure (i.e. 
setting the nonlinear terms and applying 376627430b45SBarry Smith boundary conditions again will not change the nonzero structure) 376727430b45SBarry Smith MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 376827430b45SBarry Smith MatStoreValues(mat); 376927430b45SBarry Smith Call SNESSetJacobian() with matrix 377027430b45SBarry Smith In your Jacobian routine 377127430b45SBarry Smith MatRetrieveValues(mat); 377227430b45SBarry Smith Set nonlinear terms in matrix 3773be6bf707SBarry Smith 377427430b45SBarry Smith Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself: 377527430b45SBarry Smith // build linear portion of Jacobian 377627430b45SBarry Smith MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 377727430b45SBarry Smith MatStoreValues(mat); 377827430b45SBarry Smith loop over nonlinear iterations 377927430b45SBarry Smith MatRetrieveValues(mat); 378027430b45SBarry Smith // call MatSetValues(mat,...) to set nonlinear portion of Jacobian 378127430b45SBarry Smith // call MatAssemblyBegin/End() on matrix 378227430b45SBarry Smith Solve linear system with Jacobian 378327430b45SBarry Smith endloop 378427430b45SBarry Smith .ve 3785be6bf707SBarry Smith 3786be6bf707SBarry Smith Notes: 3787da81f932SPierre Jolivet Matrix must already be assembled before calling this routine. 378811a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3789be6bf707SBarry Smith calling this routine. 3790be6bf707SBarry Smith 37910c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37920c468ba9SBarry Smith and does not allocate additional space. 
37930c468ba9SBarry Smith 37941cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()` 3795be6bf707SBarry Smith @*/ 3796d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3797d71ae5a4SJacob Faibussowitsch { 3798be6bf707SBarry Smith PetscFunctionBegin; 37990700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 380028b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 380128b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3802cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 38033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3804be6bf707SBarry Smith } 3805be6bf707SBarry Smith 3806d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3807d71ae5a4SJacob Faibussowitsch { 3808be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3809d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3810be6bf707SBarry Smith 3811be6bf707SBarry Smith PetscFunctionBegin; 381228b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 381328b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3814be6bf707SBarry Smith /* copy values over */ 38159566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 38163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3817be6bf707SBarry Smith } 3818be6bf707SBarry Smith 3819be6bf707SBarry Smith /*@ 382020f4b53cSBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()` 3821be6bf707SBarry Smith 3822c3339decSBarry Smith Logically Collective 3823be6bf707SBarry Smith 38242fe279fdSBarry Smith Input 
Parameter: 382511a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3826be6bf707SBarry Smith 382715091d37SBarry Smith Level: advanced 382815091d37SBarry Smith 38291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()` 3830be6bf707SBarry Smith @*/ 3831d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3832d71ae5a4SJacob Faibussowitsch { 3833be6bf707SBarry Smith PetscFunctionBegin; 38340700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 383528b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 383628b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3837cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 38383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3839be6bf707SBarry Smith } 3840be6bf707SBarry Smith 384117ab2063SBarry Smith /*@C 384211a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 38430d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 384420f4b53cSBarry Smith the user should preallocate the matrix storage by setting the parameter `nz` 384520f4b53cSBarry Smith (or the array `nnz`). 384617ab2063SBarry Smith 3847d083f849SBarry Smith Collective 3848db81eaa0SLois Curfman McInnes 384917ab2063SBarry Smith Input Parameters: 385011a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 385117ab2063SBarry Smith . m - number of rows 385217ab2063SBarry Smith . n - number of columns 385317ab2063SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 385451c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38550298fd71SBarry Smith (possibly different for each row) or NULL 385617ab2063SBarry Smith 385717ab2063SBarry Smith Output Parameter: 3858416022c9SBarry Smith . A - the matrix 385917ab2063SBarry Smith 38602ef1f0ffSBarry Smith Options Database Keys: 38612ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 38622ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 38632ef1f0ffSBarry Smith 38642ef1f0ffSBarry Smith Level: intermediate 3865175b88e8SBarry Smith 3866b259b22eSLois Curfman McInnes Notes: 38672ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 386849a6f317SBarry Smith 38692ef1f0ffSBarry Smith The `MATSEQAIJ` format, also called 38702ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 38710002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 38722ef1f0ffSBarry Smith either one (as in Fortran) or zero. 387317ab2063SBarry Smith 387420f4b53cSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 38752ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 387620f4b53cSBarry Smith allocation. 387717ab2063SBarry Smith 3878682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38794fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3880682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38816c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 
38826c7ebb05SLois Curfman McInnes 38831cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 388417ab2063SBarry Smith @*/ 3885d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3886d71ae5a4SJacob Faibussowitsch { 38873a40ed3dSBarry Smith PetscFunctionBegin; 38889566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 38899566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 38909566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 38919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 38923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3893273d9f13SBarry Smith } 3894273d9f13SBarry Smith 3895273d9f13SBarry Smith /*@C 3896273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3897273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3898273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3899273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3900273d9f13SBarry Smith 3901d083f849SBarry Smith Collective 3902273d9f13SBarry Smith 3903273d9f13SBarry Smith Input Parameters: 39041c4f3114SJed Brown + B - The matrix 3905273d9f13SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 3906273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 39070298fd71SBarry Smith (possibly different for each row) or NULL 3908273d9f13SBarry Smith 39092ef1f0ffSBarry Smith Options Database Keys: 39102ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 39112ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 39122ef1f0ffSBarry Smith 39132ef1f0ffSBarry Smith Level: intermediate 39142ef1f0ffSBarry Smith 3915273d9f13SBarry Smith Notes: 39162ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 391749a6f317SBarry Smith 391811a5261eSBarry Smith The `MATSEQAIJ` format, also called 39192ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 3920273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3921273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3922273d9f13SBarry Smith 39232ef1f0ffSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 39242ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 39252ef1f0ffSBarry Smith allocation. 3926273d9f13SBarry Smith 392711a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3928aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3929aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3930aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3931aa95bbe8SBarry Smith 393211a5261eSBarry Smith Developer Notes: 393311a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3934a96a251dSBarry Smith entries or columns indices 3935a96a251dSBarry Smith 3936273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3937273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3938273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3939273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3940273d9f13SBarry Smith 39411cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3942db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3943273d9f13SBarry Smith @*/ 3944d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3945d71ae5a4SJacob Faibussowitsch { 3946a23d5eceSKris Buschelman PetscFunctionBegin; 39476ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39486ba663aaSJed Brown PetscValidType(B, 1); 3949cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 39503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3951a23d5eceSKris Buschelman } 3952a23d5eceSKris Buschelman 3953d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3954d71ae5a4SJacob Faibussowitsch { 3955ad79cf63SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 39562576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE; 395797f1f81fSBarry Smith PetscInt i; 3958273d9f13SBarry Smith 3959273d9f13SBarry Smith PetscFunctionBegin; 3960ad79cf63SBarry Smith if (B->hash_active) { 3961ad79cf63SBarry Smith 
PetscCall(PetscMemcpy(&B->ops, &b->cops, sizeof(*(B->ops)))); 3962ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3963ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3964ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3965ad79cf63SBarry Smith } 39662576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3967a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3968c461c341SBarry Smith skipallocation = PETSC_TRUE; 3969c461c341SBarry Smith nz = 0; 3970c461c341SBarry Smith } 39719566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39729566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3973899cda47SBarry Smith 3974435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 397508401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3976cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3977d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 397808401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 397908401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3980b73539f3SBarry Smith } 3981b73539f3SBarry Smith } 3982b73539f3SBarry Smith 3983273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3984ab93d7beSBarry Smith if (!skipallocation) { 39854dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3986071fcb05SBarry Smith if (!b->ilen) { 3987071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39889566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3989071fcb05SBarry Smith } else { 39909566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39912ee49352SLisandro Dalcin } 3992aa624791SPierre Jolivet if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); 3993273d9f13SBarry Smith if (!nnz) { 3994435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3995c62bd62aSJed Brown else if (nz < 0) nz = 1; 39965d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3997d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 3998d0f46423SBarry Smith nz = nz * B->rmap->n; 3999273d9f13SBarry Smith } else { 4000c73702f5SBarry Smith PetscInt64 nz64 = 0; 40019371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 40029371c9d4SSatish Balay b->imax[i] = nnz[i]; 40039371c9d4SSatish Balay nz64 += nnz[i]; 40049371c9d4SSatish Balay } 40059566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 4006273d9f13SBarry Smith } 4007ab93d7beSBarry Smith 4008273d9f13SBarry Smith /* allocate the matrix space */ 400953dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 40109566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 4011396832f4SHong Zhang if (B->structure_only) { 40129566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 40139566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 4014396832f4SHong Zhang } else { 40159566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 4016396832f4SHong Zhang } 4017bfeeae90SHong Zhang b->i[0] = 0; 4018ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4019396832f4SHong Zhang if (B->structure_only) { 4020396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4021396832f4SHong Zhang b->free_a = PETSC_FALSE; 4022396832f4SHong Zhang } else { 4023273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4024e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4025396832f4SHong Zhang } 4026e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4027c461c341SBarry Smith } else { 4028e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4029e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4030c461c341SBarry Smith } 4031273d9f13SBarry Smith 4032846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4033846b4da1SFande Kong /* reserve user-requested sparsity */ 40349566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4035846b4da1SFande Kong } 4036846b4da1SFande Kong 4037273d9f13SBarry Smith b->nz = 0; 4038273d9f13SBarry Smith b->maxnz = nz; 4039273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40401baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4041cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4042cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40435519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40445519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40455519a089SJose E. Roman */ 40465519a089SJose E. Roman B->nonzerostate++; 40473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4048273d9f13SBarry Smith } 4049273d9f13SBarry Smith 4050d71ae5a4SJacob Faibussowitsch PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4051d71ae5a4SJacob Faibussowitsch { 4052846b4da1SFande Kong Mat_SeqAIJ *a; 4053a5bbaf83SFande Kong PetscInt i; 40541f14be2bSBarry Smith PetscBool skipreset; 4055846b4da1SFande Kong 4056846b4da1SFande Kong PetscFunctionBegin; 4057846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 405814d0e64fSAlex Lindsay 405914d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 40603ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 406114d0e64fSAlex Lindsay 4062846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40632c814fdeSFande Kong /* if no saved info, we error out */ 406428b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40652c814fdeSFande Kong 40661f14be2bSBarry Smith PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40672c814fdeSFande Kong 40681f14be2bSBarry Smith PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset)); 40691f14be2bSBarry Smith if (!skipreset) { 40709566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40719566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4072846b4da1SFande Kong a->i[0] = 0; 4073ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4074846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4075846b4da1SFande Kong a->nz = 0; 4076846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4077846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4078846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4079846b4da1SFande Kong A->assembled = PETSC_FALSE; 
40801f14be2bSBarry Smith } 40813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4082846b4da1SFande Kong } 4083846b4da1SFande Kong 408458d36128SBarry Smith /*@ 408511a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4086a1661176SMatthew Knepley 4087a1661176SMatthew Knepley Input Parameters: 4088a1661176SMatthew Knepley + B - the matrix 4089a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4090a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4091a1661176SMatthew Knepley - v - optional values in the matrix 4092a1661176SMatthew Knepley 4093a1661176SMatthew Knepley Level: developer 4094a1661176SMatthew Knepley 40956a9b8d82SBarry Smith Notes: 40962ef1f0ffSBarry Smith The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 409758d36128SBarry Smith 40986a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 40996a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 41006a9b8d82SBarry Smith 41016a9b8d82SBarry Smith Developer Notes: 41022ef1f0ffSBarry Smith An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and 41032ef1f0ffSBarry Smith then just copies the `v` values directly with `PetscMemcpy()`. 41046a9b8d82SBarry Smith 410511a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
41066a9b8d82SBarry Smith 41071cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()` 4108a1661176SMatthew Knepley @*/ 4109d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4110d71ae5a4SJacob Faibussowitsch { 4111a1661176SMatthew Knepley PetscFunctionBegin; 41120700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41136ba663aaSJed Brown PetscValidType(B, 1); 4114cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 41153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4116a1661176SMatthew Knepley } 4117a1661176SMatthew Knepley 4118d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4119d71ae5a4SJacob Faibussowitsch { 4120a1661176SMatthew Knepley PetscInt i; 4121a1661176SMatthew Knepley PetscInt m, n; 4122a1661176SMatthew Knepley PetscInt nz; 41236a9b8d82SBarry Smith PetscInt *nnz; 4124a1661176SMatthew Knepley 4125a1661176SMatthew Knepley PetscFunctionBegin; 4126aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4127779a8d59SSatish Balay 41289566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41299566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4130779a8d59SSatish Balay 41319566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41329566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4133a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4134b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 413508401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, 
PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4136a1661176SMatthew Knepley nnz[i] = nz; 4137a1661176SMatthew Knepley } 41389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41399566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4140a1661176SMatthew Knepley 414148a46eb9SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4142a1661176SMatthew Knepley 41439566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41449566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4145a1661176SMatthew Knepley 41469566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 41473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4148a1661176SMatthew Knepley } 4149a1661176SMatthew Knepley 4150ad7e164aSPierre Jolivet /*@ 41512ef1f0ffSBarry Smith MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`. 4152ad7e164aSPierre Jolivet 4153ad7e164aSPierre Jolivet Input Parameters: 4154ad7e164aSPierre Jolivet + A - left-hand side matrix 4155ad7e164aSPierre Jolivet . B - right-hand side matrix 415611a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4157ad7e164aSPierre Jolivet 4158ad7e164aSPierre Jolivet Output Parameter: 41592ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B` 4160ad7e164aSPierre Jolivet 4161ad7e164aSPierre Jolivet Level: intermediate 4162ad7e164aSPierre Jolivet 416311a5261eSBarry Smith Note: 416411a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4165ad7e164aSPierre Jolivet 41661cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4167ad7e164aSPierre Jolivet @*/ 4168d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4169d71ae5a4SJacob Faibussowitsch { 4170ad7e164aSPierre Jolivet PetscFunctionBegin; 4171ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4172ad7e164aSPierre Jolivet PetscValidType(A, 1); 4173ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4174ad7e164aSPierre Jolivet PetscValidType(B, 2); 4175ad7e164aSPierre Jolivet PetscValidPointer(C, 4); 4176ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4177ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4178ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4179ad7e164aSPierre Jolivet } 4180cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 41813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4182ad7e164aSPierre Jolivet } 4183ad7e164aSPierre Jolivet 4184d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4185d71ae5a4SJacob Faibussowitsch { 4186ad7e164aSPierre Jolivet Mat newmat; 4187ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4188ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4189ad7e164aSPierre Jolivet PetscScalar *v; 4190fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4191ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4192ad7e164aSPierre Jolivet PetscBool flg; 4193ad7e164aSPierre Jolivet 4194ad7e164aSPierre Jolivet PetscFunctionBegin; 419528b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 419628b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 419728b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 419828b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 41999566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 420028b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4201aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4202ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42039566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 42049566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 42059566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 42069566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4207ad7e164aSPierre Jolivet i[0] = 0; 4208ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4209ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4210ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4211ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4212ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4213ad7e164aSPierre Jolivet } 4214ad7e164aSPierre Jolivet } 4215ad7e164aSPierre Jolivet } 42169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4217ad7e164aSPierre Jolivet *C = newmat; 42189566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4219ad7e164aSPierre Jolivet nnz = 0; 4220ad7e164aSPierre Jolivet } 42219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 
42229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4224ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4225ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4226ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4227ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4228ad7e164aSPierre Jolivet } 4229ad7e164aSPierre Jolivet } 4230ad7e164aSPierre Jolivet } 42319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 42343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4235ad7e164aSPierre Jolivet } 4236ad7e164aSPierre Jolivet 4237c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4238af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4239170fe5c8SBarry Smith 4240170fe5c8SBarry Smith /* 4241170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4242170fe5c8SBarry Smith 4243170fe5c8SBarry Smith n p p 42442da392ccSBarry Smith [ ] [ ] [ ] 42452da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42462da392ccSBarry Smith [ ] [ ] [ ] 4247170fe5c8SBarry Smith 4248170fe5c8SBarry Smith */ 4249d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4250d71ae5a4SJacob Faibussowitsch { 4251170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4252170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4253170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 425486214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4255170fe5c8SBarry Smith const PetscInt *ii, *idx; 4256170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4257170fe5c8SBarry Smith PetscScalar *c, *c_q; 425886214ceeSStefano Zampini PetscInt clda 
= sub_c->lda; 425986214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4260170fe5c8SBarry Smith 4261170fe5c8SBarry Smith PetscFunctionBegin; 4262d0f46423SBarry Smith m = A->rmap->n; 4263d0f46423SBarry Smith n = A->cmap->n; 4264d0f46423SBarry Smith p = B->cmap->n; 4265170fe5c8SBarry Smith a = sub_a->v; 4266170fe5c8SBarry Smith b = sub_b->a; 4267170fe5c8SBarry Smith c = sub_c->v; 426886214ceeSStefano Zampini if (clda == m) { 42699566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 427086214ceeSStefano Zampini } else { 427186214ceeSStefano Zampini for (j = 0; j < p; j++) 42729371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 427386214ceeSStefano Zampini } 4274170fe5c8SBarry Smith ii = sub_b->i; 4275170fe5c8SBarry Smith idx = sub_b->j; 4276170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4277170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4278170fe5c8SBarry Smith while (q-- > 0) { 427986214ceeSStefano Zampini c_q = c + clda * (*idx); 428086214ceeSStefano Zampini a_q = a + alda * i; 4281854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4282170fe5c8SBarry Smith idx++; 4283170fe5c8SBarry Smith b++; 4284170fe5c8SBarry Smith } 4285170fe5c8SBarry Smith } 42863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4287170fe5c8SBarry Smith } 4288170fe5c8SBarry Smith 4289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4290d71ae5a4SJacob Faibussowitsch { 4291d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 429286214ceeSStefano Zampini PetscBool cisdense; 4293170fe5c8SBarry Smith 4294170fe5c8SBarry Smith PetscFunctionBegin; 429508401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42969566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 42979566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 
4298d5e393b6SSuyash Tandon PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 429948a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 43009566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4301d73949e8SHong Zhang 43024222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 43033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4304170fe5c8SBarry Smith } 4305170fe5c8SBarry Smith 43060bad9183SKris Buschelman /*MC 4307fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43080bad9183SKris Buschelman based on compressed sparse row format. 43090bad9183SKris Buschelman 43102ef1f0ffSBarry Smith Options Database Key: 43110bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43120bad9183SKris Buschelman 43130bad9183SKris Buschelman Level: beginner 43140bad9183SKris Buschelman 43150cd7f59aSBarry Smith Notes: 43162ef1f0ffSBarry Smith `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values, 43170cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43180cd7f59aSBarry Smith in the matrix 43190cd7f59aSBarry Smith 432011a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this no 432111a5261eSBarry Smith space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored 43220cd7f59aSBarry Smith 432311a5261eSBarry Smith Developer Note: 43242ef1f0ffSBarry Smith It would be nice if all matrix formats supported passing `NULL` in for the numerical values 43250cd7f59aSBarry Smith 43261cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 43270bad9183SKris Buschelman M*/ 43280bad9183SKris Buschelman 4329ccd284c7SBarry Smith /*MC 4330ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 4331ccd284c7SBarry Smith 433211a5261eSBarry Smith This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator, 433311a5261eSBarry Smith and `MATMPIAIJ` otherwise. As a result, for single process communicators, 433411a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4335ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4336ccd284c7SBarry Smith the above preallocation routines for simplicity. 4337ccd284c7SBarry Smith 43382ef1f0ffSBarry Smith Options Database Key: 433911a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()` 4340ccd284c7SBarry Smith 43412ef1f0ffSBarry Smith Level: beginner 43422ef1f0ffSBarry Smith 434311a5261eSBarry Smith Note: 434411a5261eSBarry Smith Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when 4345ccd284c7SBarry Smith enough exist. 
4346ccd284c7SBarry Smith 43471cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4348ccd284c7SBarry Smith M*/ 4349ccd284c7SBarry Smith 4350ccd284c7SBarry Smith /*MC 4351ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4352ccd284c7SBarry Smith 43532ef1f0ffSBarry Smith Options Database Key: 43542ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 43552ef1f0ffSBarry Smith 43562ef1f0ffSBarry Smith Level: beginner 43572ef1f0ffSBarry Smith 43582ef1f0ffSBarry Smith Note: 435911a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 436011a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 436111a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4362ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4363ccd284c7SBarry Smith the above preallocation routines for simplicity. 4364ccd284c7SBarry Smith 43651cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4366ccd284c7SBarry Smith M*/ 4367ccd284c7SBarry Smith 43687906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43697906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43707906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43717906f579SHong Zhang #endif 4372d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4373d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4374d24d4204SJose E. 
Roman #endif 43757906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43767906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43777906f579SHong Zhang #endif 43787906f579SHong Zhang 4379d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4380c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43814222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43827906f579SHong Zhang 43838c778c55SBarry Smith /*@C 438411a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43858c778c55SBarry Smith 43868c778c55SBarry Smith Not Collective 43878c778c55SBarry Smith 43888c778c55SBarry Smith Input Parameter: 438911a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 43908c778c55SBarry Smith 43918c778c55SBarry Smith Output Parameter: 43928c778c55SBarry Smith . 
array - pointer to the data 43938c778c55SBarry Smith 43948c778c55SBarry Smith Level: intermediate 43958c778c55SBarry Smith 43960ab4885dSBarry Smith Fortran Note: 43970ab4885dSBarry Smith `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()` 43980ab4885dSBarry Smith 43991cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 44008c778c55SBarry Smith @*/ 4401d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4402d71ae5a4SJacob Faibussowitsch { 4403d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44048c778c55SBarry Smith 44058c778c55SBarry Smith PetscFunctionBegin; 4406d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44079566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4408d67d9f35SJunchao Zhang } else { 4409d67d9f35SJunchao Zhang *array = aij->a; 4410d67d9f35SJunchao Zhang } 44113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4412d67d9f35SJunchao Zhang } 4413d67d9f35SJunchao Zhang 4414d67d9f35SJunchao Zhang /*@C 441511a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4416d67d9f35SJunchao Zhang 4417d67d9f35SJunchao Zhang Not Collective 4418d67d9f35SJunchao Zhang 4419d67d9f35SJunchao Zhang Input Parameters: 442011a5261eSBarry Smith + mat - a `MATSEQAIJ` matrix 4421d67d9f35SJunchao Zhang - array - pointer to the data 4422d67d9f35SJunchao Zhang 4423d67d9f35SJunchao Zhang Level: intermediate 4424d67d9f35SJunchao Zhang 44250ab4885dSBarry Smith Fortran Note: 44260ab4885dSBarry Smith `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()` 44270ab4885dSBarry Smith 44281cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4429d67d9f35SJunchao Zhang @*/ 4430d71ae5a4SJacob 
Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array) 4431d71ae5a4SJacob Faibussowitsch { 4432d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4433d67d9f35SJunchao Zhang 4434d67d9f35SJunchao Zhang PetscFunctionBegin; 4435d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44369566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4437d67d9f35SJunchao Zhang } else { 4438d67d9f35SJunchao Zhang *array = NULL; 4439d67d9f35SJunchao Zhang } 44409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44419566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44438c778c55SBarry Smith } 44448c778c55SBarry Smith 444521e72a00SBarry Smith /*@C 444611a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44478f1ea47aSStefano Zampini 44480ab4885dSBarry Smith Not Collective; No Fortran Support 44498f1ea47aSStefano Zampini 44508f1ea47aSStefano Zampini Input Parameter: 445111a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44528f1ea47aSStefano Zampini 44538f1ea47aSStefano Zampini Output Parameter: 44548f1ea47aSStefano Zampini . 
array - pointer to the data 44558f1ea47aSStefano Zampini 44568f1ea47aSStefano Zampini Level: intermediate 44578f1ea47aSStefano Zampini 44581cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44598f1ea47aSStefano Zampini @*/ 4460d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4461d71ae5a4SJacob Faibussowitsch { 4462d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44638f1ea47aSStefano Zampini 44648f1ea47aSStefano Zampini PetscFunctionBegin; 4465d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44669566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4467d67d9f35SJunchao Zhang } else { 4468d67d9f35SJunchao Zhang *array = aij->a; 4469d67d9f35SJunchao Zhang } 44703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44718f1ea47aSStefano Zampini } 44728f1ea47aSStefano Zampini 44738f1ea47aSStefano Zampini /*@C 447411a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44758f1ea47aSStefano Zampini 44760ab4885dSBarry Smith Not Collective; No Fortran Support 44778f1ea47aSStefano Zampini 44788f1ea47aSStefano Zampini Input Parameter: 447911a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 44808f1ea47aSStefano Zampini 44818f1ea47aSStefano Zampini Output Parameter: 44828f1ea47aSStefano Zampini . 
array - pointer to the data 44838f1ea47aSStefano Zampini 44848f1ea47aSStefano Zampini Level: intermediate 44858f1ea47aSStefano Zampini 44861cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44878f1ea47aSStefano Zampini @*/ 4488d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4489d71ae5a4SJacob Faibussowitsch { 4490d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44918f1ea47aSStefano Zampini 44928f1ea47aSStefano Zampini PetscFunctionBegin; 4493d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44949566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4495d67d9f35SJunchao Zhang } else { 4496d67d9f35SJunchao Zhang *array = NULL; 4497d67d9f35SJunchao Zhang } 44983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4499d67d9f35SJunchao Zhang } 4500d67d9f35SJunchao Zhang 4501d67d9f35SJunchao Zhang /*@C 450211a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4503d67d9f35SJunchao Zhang 45040ab4885dSBarry Smith Not Collective; No Fortran Support 4505d67d9f35SJunchao Zhang 4506d67d9f35SJunchao Zhang Input Parameter: 450711a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 4508d67d9f35SJunchao Zhang 4509d67d9f35SJunchao Zhang Output Parameter: 4510d67d9f35SJunchao Zhang . 
array - pointer to the data 4511d67d9f35SJunchao Zhang 4512d67d9f35SJunchao Zhang Level: intermediate 4513d67d9f35SJunchao Zhang 45141cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4515d67d9f35SJunchao Zhang @*/ 4516d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4517d71ae5a4SJacob Faibussowitsch { 4518d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4519d67d9f35SJunchao Zhang 4520d67d9f35SJunchao Zhang PetscFunctionBegin; 4521d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45229566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4523d67d9f35SJunchao Zhang } else { 4524d67d9f35SJunchao Zhang *array = aij->a; 4525d67d9f35SJunchao Zhang } 45269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45279566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 45283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4529d67d9f35SJunchao Zhang } 4530d67d9f35SJunchao Zhang 4531d67d9f35SJunchao Zhang /*@C 4532d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4533d67d9f35SJunchao Zhang 45340ab4885dSBarry Smith Not Collective; No Fortran Support 4535d67d9f35SJunchao Zhang 4536d67d9f35SJunchao Zhang Input Parameter: 4537d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4538d67d9f35SJunchao Zhang 4539d67d9f35SJunchao Zhang Output Parameter: 4540d67d9f35SJunchao Zhang . 
array - pointer to the data 4541d67d9f35SJunchao Zhang 4542d67d9f35SJunchao Zhang Level: intermediate 4543d67d9f35SJunchao Zhang 45441cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4545d67d9f35SJunchao Zhang @*/ 4546d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4547d71ae5a4SJacob Faibussowitsch { 4548d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4549d67d9f35SJunchao Zhang 4550d67d9f35SJunchao Zhang PetscFunctionBegin; 4551d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45529566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4553d67d9f35SJunchao Zhang } else { 4554d67d9f35SJunchao Zhang *array = NULL; 4555d67d9f35SJunchao Zhang } 45563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45578f1ea47aSStefano Zampini } 45588f1ea47aSStefano Zampini 45598f1ea47aSStefano Zampini /*@C 456011a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45617ee59b9bSJunchao Zhang 45620ab4885dSBarry Smith Not Collective; No Fortran Support 45637ee59b9bSJunchao Zhang 45647ee59b9bSJunchao Zhang Input Parameter: 456511a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45667ee59b9bSJunchao Zhang 45677ee59b9bSJunchao Zhang Output Parameters: 45687ee59b9bSJunchao Zhang + i - row map array of the matrix 45697ee59b9bSJunchao Zhang . j - column index array of the matrix 45707ee59b9bSJunchao Zhang . a - data array of the matrix 45717ee59b9bSJunchao Zhang - memtype - memory type of the arrays 45727ee59b9bSJunchao Zhang 45732ef1f0ffSBarry Smith Level: Developer 45742ef1f0ffSBarry Smith 45757ee59b9bSJunchao Zhang Notes: 45762ef1f0ffSBarry Smith Any of the output parameters can be `NULL`, in which case the corresponding value is not returned. 45777ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. 
Otherwise, they are on the host. 45787ee59b9bSJunchao Zhang 45797ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45802ef1f0ffSBarry Smith If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix. 45817ee59b9bSJunchao Zhang 45821cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45837ee59b9bSJunchao Zhang @*/ 4584d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype) 4585d71ae5a4SJacob Faibussowitsch { 45867ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45877ee59b9bSJunchao Zhang 45887ee59b9bSJunchao Zhang PetscFunctionBegin; 45897ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45907ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45917ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45927ee59b9bSJunchao Zhang } else { 45937ee59b9bSJunchao Zhang if (i) *i = aij->i; 45947ee59b9bSJunchao Zhang if (j) *j = aij->j; 45957ee59b9bSJunchao Zhang if (a) *a = aij->a; 45967ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45977ee59b9bSJunchao Zhang } 45983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45997ee59b9bSJunchao Zhang } 46007ee59b9bSJunchao Zhang 46017ee59b9bSJunchao Zhang /*@C 460221e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 460321e72a00SBarry Smith 460421e72a00SBarry Smith Not Collective 460521e72a00SBarry Smith 460621e72a00SBarry Smith Input Parameter: 460711a5261eSBarry Smith . mat - a `MATSEQAIJ` matrix 460821e72a00SBarry Smith 460921e72a00SBarry Smith Output Parameter: 461021e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 461121e72a00SBarry Smith 461221e72a00SBarry Smith Level: intermediate 461321e72a00SBarry Smith 46141cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 461521e72a00SBarry Smith @*/ 4616d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4617d71ae5a4SJacob Faibussowitsch { 461821e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 461921e72a00SBarry Smith 462021e72a00SBarry Smith PetscFunctionBegin; 462121e72a00SBarry Smith *nz = aij->rmax; 46223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 462321e72a00SBarry Smith } 462421e72a00SBarry Smith 4625d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4626d71ae5a4SJacob Faibussowitsch { 4627394ed5ebSJunchao Zhang MPI_Comm comm; 4628394ed5ebSJunchao Zhang PetscInt *i, *j; 4629394ed5ebSJunchao Zhang PetscInt M, N, row; 4630394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4631394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4632394ed5ebSJunchao Zhang PetscInt *Aj; 4633394ed5ebSJunchao Zhang PetscScalar *Aa; 4634cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)(mat->data); 4635cbc6b225SStefano Zampini MatType rtype; 4636394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 4637394ed5ebSJunchao Zhang 4638394ed5ebSJunchao Zhang PetscFunctionBegin; 46399566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(mat)); 46409566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46419566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4642e8729f6fSJunchao Zhang i = coo_i; 4643e8729f6fSJunchao Zhang j = coo_j; 46449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 4645394ed5ebSJunchao 
Zhang for (k = 0; k < coo_n; k++) { /* Ignore entries with negative row or col indices */ 4646394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 4647394ed5ebSJunchao Zhang perm[k] = k; 4648394ed5ebSJunchao Zhang } 4649394ed5ebSJunchao Zhang 4650394ed5ebSJunchao Zhang /* Sort by row */ 46519566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 46529371c9d4SSatish Balay for (k = 0; k < coo_n; k++) { 46539371c9d4SSatish Balay if (i[k] >= 0) break; 46549371c9d4SSatish Balay } /* Advance k to the first row with a non-negative index */ 4655394ed5ebSJunchao Zhang nneg = k; 46569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */ 4657394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 465835cb6cd3SPierre Jolivet jmap++; /* Inc jmap by 1 for convenience */ 4659394ed5ebSJunchao Zhang 46609566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 46619566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4662394ed5ebSJunchao Zhang 4663394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 466435cb6cd3SPierre Jolivet Ai++; /* Inc by 1 for convenience */ 4665394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4666394ed5ebSJunchao Zhang while (k < coo_n) { 4667394ed5ebSJunchao Zhang row = i[k]; 4668394ed5ebSJunchao Zhang start = k; /* [start,end) indices for this row */ 4669394ed5ebSJunchao Zhang while (k < coo_n && i[k] == row) k++; 4670394ed5ebSJunchao Zhang end = k; 46719566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4672394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4673394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first 
nonzero in this row */ 4674394ed5ebSJunchao Zhang jmap[q] = 1; /* Number of repeats of this nozero entry */ 4675394ed5ebSJunchao Zhang Ai[row] = 1; 4676394ed5ebSJunchao Zhang nnz++; 4677394ed5ebSJunchao Zhang 4678394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4679394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4680394ed5ebSJunchao Zhang q++; 4681394ed5ebSJunchao Zhang jmap[q] = 1; 4682394ed5ebSJunchao Zhang Aj[q] = j[p]; 4683394ed5ebSJunchao Zhang Ai[row]++; 4684394ed5ebSJunchao Zhang nnz++; 4685394ed5ebSJunchao Zhang } else { 4686394ed5ebSJunchao Zhang jmap[q]++; 4687394ed5ebSJunchao Zhang } 4688394ed5ebSJunchao Zhang } 4689394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4690394ed5ebSJunchao Zhang } 4691394ed5ebSJunchao Zhang 4692394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4693394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 4694394ed5ebSJunchao Zhang jmap--; /* Back to the beginning of jmap[] */ 4695394ed5ebSJunchao Zhang jmap[0] = 0; 4696394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 4697394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4698394ed5ebSJunchao Zhang PetscCount *jmap_new; 4699394ed5ebSJunchao Zhang PetscInt *Aj_new; 4700394ed5ebSJunchao Zhang 47019566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 47029566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 47039566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4704394ed5ebSJunchao Zhang jmap = jmap_new; 4705394ed5ebSJunchao Zhang 47069566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 47079566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 47089566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4709394ed5ebSJunchao Zhang Aj = Aj_new; 4710394ed5ebSJunchao Zhang } 4711394ed5ebSJunchao 
Zhang 4712394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4713394ed5ebSJunchao Zhang PetscCount *perm_new; 4714cbc6b225SStefano Zampini 47159566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 47169566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 47179566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4718394ed5ebSJunchao Zhang perm = perm_new; 4719394ed5ebSJunchao Zhang } 4720394ed5ebSJunchao Zhang 47219566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 47229566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 47239566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4724394ed5ebSJunchao Zhang 4725394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4726394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 4727394ed5ebSJunchao Zhang /* Record COO fields */ 4728394ed5ebSJunchao Zhang seqaij->coo_n = coo_n; 4729394ed5ebSJunchao Zhang seqaij->Atot = coo_n - nneg; /* Annz is seqaij->nz, so no need to record that again */ 4730394ed5ebSJunchao Zhang seqaij->jmap = jmap; /* of length nnz+1 */ 4731394ed5ebSJunchao Zhang seqaij->perm = perm; 47323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4733394ed5ebSJunchao Zhang } 4734394ed5ebSJunchao Zhang 4735d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4736d71ae5a4SJacob Faibussowitsch { 4737394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4738394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 4739394ed5ebSJunchao Zhang PetscCount *perm = aseq->perm, *jmap = aseq->jmap; 4740394ed5ebSJunchao Zhang 
PetscScalar *Aa; 4741394ed5ebSJunchao Zhang 4742394ed5ebSJunchao Zhang PetscFunctionBegin; 47439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4744394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4745b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4746b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4747b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4748394ed5ebSJunchao Zhang } 47499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 47503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4751394ed5ebSJunchao Zhang } 4752394ed5ebSJunchao Zhang 475334b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47545063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 475502fe1965SBarry Smith #endif 4756d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4757d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *); 4758d5e393b6SSuyash Tandon #endif 47593d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47605063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 47613d0639e7SStefano Zampini #endif 476202fe1965SBarry Smith 4763d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4764d71ae5a4SJacob Faibussowitsch { 4765273d9f13SBarry Smith Mat_SeqAIJ *b; 476638baddfdSBarry Smith PetscMPIInt size; 4767273d9f13SBarry Smith 4768273d9f13SBarry Smith PetscFunctionBegin; 47699566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 477008401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4771273d9f13SBarry Smith 47724dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 47732205254eSKarl Rupp 4774b0a32e0cSBarry Smith B->data = (void *)b; 
47752205254eSKarl Rupp 47769566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 4777071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 47782205254eSKarl Rupp 4779f4259b30SLisandro Dalcin b->row = NULL; 4780f4259b30SLisandro Dalcin b->col = NULL; 4781f4259b30SLisandro Dalcin b->icol = NULL; 4782b810aeb4SBarry Smith b->reallocs = 0; 478336db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4784f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4785416022c9SBarry Smith b->nonew = 0; 4786f4259b30SLisandro Dalcin b->diag = NULL; 4787f4259b30SLisandro Dalcin b->solve_work = NULL; 4788f4259b30SLisandro Dalcin B->spptr = NULL; 4789f4259b30SLisandro Dalcin b->saved_values = NULL; 4790f4259b30SLisandro Dalcin b->idiag = NULL; 4791f4259b30SLisandro Dalcin b->mdiag = NULL; 4792f4259b30SLisandro Dalcin b->ssor_work = NULL; 479371f1c65dSBarry Smith b->omega = 1.0; 479471f1c65dSBarry Smith b->fshift = 0.0; 479571f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4796bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4797a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 479817ab2063SBarry Smith 47999566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4800d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 48019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 48029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4803b3866ffcSBarry Smith #endif 48049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 48059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 48069566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 48079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 48089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 48099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 48109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 48119779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 48129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4813191b95cbSRichard Tran Mills #endif 481434b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48159566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 48169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 48179566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 481802fe1965SBarry Smith #endif 4819d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4820d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 4821d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 4822d5e393b6SSuyash Tandon 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ)); 4823d5e393b6SSuyash Tandon #endif 48243d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48259566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 48263d0639e7SStefano Zampini #endif 48279566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4828af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 48299566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4830af8000cdSHong Zhang #endif 4831d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 48329566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4833d24d4204SJose E. 
Roman #endif 483463c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 48359566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 48369566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 483763c07aadSStefano Zampini #endif 48389566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 48399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 48409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 48419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 48429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ)); 48439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 48449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 48459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 48469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 48479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 48489566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 48499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 48509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 48519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 48529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 48539566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 48549566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 48559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 48563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 485717ab2063SBarry Smith } 485817ab2063SBarry Smith 4859b24902e0SBarry Smith /* 48603893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4861b24902e0SBarry Smith */ 4862d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4863d71ae5a4SJacob Faibussowitsch { 48642a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4865071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 486617ab2063SBarry Smith 48673a40ed3dSBarry Smith PetscFunctionBegin; 4868aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4869273d9f13SBarry Smith 4870d5f3da31SBarry Smith C->factortype = A->factortype; 4871f4259b30SLisandro 
Dalcin c->row = NULL; 4872f4259b30SLisandro Dalcin c->col = NULL; 4873f4259b30SLisandro Dalcin c->icol = NULL; 48746ad4291fSHong Zhang c->reallocs = 0; 487517ab2063SBarry Smith 487669272f91SPierre Jolivet C->assembled = A->assembled; 487717ab2063SBarry Smith 487869272f91SPierre Jolivet if (A->preallocated) { 48799566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 48809566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4881eec197d1SBarry Smith 488231fe6a7dSBarry Smith if (!A->hash_active) { 48839566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 48849566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 48859566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 48869566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 488717ab2063SBarry Smith 488817ab2063SBarry Smith /* allocate the matrix space */ 4889f77e22a1SHong Zhang if (mallocmatspace) { 48909566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 48912205254eSKarl Rupp 4892f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 48932205254eSKarl Rupp 48949566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 489517ab2063SBarry Smith if (m > 0) { 48969566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4897be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 48982e5835c6SStefano Zampini const PetscScalar *aa; 48992e5835c6SStefano Zampini 49009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 49019566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 49029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 4903be6bf707SBarry Smith } else { 49049566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 490517ab2063SBarry Smith } 490608480c60SBarry Smith } 4907f77e22a1SHong Zhang } 
490831fe6a7dSBarry Smith C->preallocated = PETSC_TRUE; 490931fe6a7dSBarry Smith } else { 491031fe6a7dSBarry Smith PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix"); 491131fe6a7dSBarry Smith PetscCall(MatSetUp(C)); 491231fe6a7dSBarry Smith } 491317ab2063SBarry Smith 49146ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4915416022c9SBarry Smith c->roworiented = a->roworiented; 4916416022c9SBarry Smith c->nonew = a->nonew; 4917416022c9SBarry Smith if (a->diag) { 49189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 49199566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 4920071fcb05SBarry Smith } else c->diag = NULL; 49212205254eSKarl Rupp 4922f4259b30SLisandro Dalcin c->solve_work = NULL; 4923f4259b30SLisandro Dalcin c->saved_values = NULL; 4924f4259b30SLisandro Dalcin c->idiag = NULL; 4925f4259b30SLisandro Dalcin c->ssor_work = NULL; 4926a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4927e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4928e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 49296ad4291fSHong Zhang 4930893ad86cSHong Zhang c->rmax = a->rmax; 4931416022c9SBarry Smith c->nz = a->nz; 49328ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4933754ec7b1SSatish Balay 49346ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 49356ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4936cd6b891eSBarry Smith if (a->compressedrow.use) { 49376ad4291fSHong Zhang i = a->compressedrow.nrows; 49389566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 49399566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 49409566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, 
a->compressedrow.rindex, i)); 494127ea64f8SHong Zhang } else { 494227ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 49430298fd71SBarry Smith c->compressedrow.i = NULL; 49440298fd71SBarry Smith c->compressedrow.rindex = NULL; 49456ad4291fSHong Zhang } 4946ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4947e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 49484846f1f5SKris Buschelman 49499566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 495069272f91SPierre Jolivet } 49519566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 49523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 495317ab2063SBarry Smith } 495417ab2063SBarry Smith 4955d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 4956d71ae5a4SJacob Faibussowitsch { 4957b24902e0SBarry Smith PetscFunctionBegin; 49589566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 49599566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 496048a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 49619566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 49629566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 49633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4964b24902e0SBarry Smith } 4965b24902e0SBarry Smith 4966d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4967d71ae5a4SJacob Faibussowitsch { 496852f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 496952f91c60SVaclav Hapla 497052f91c60SVaclav Hapla PetscFunctionBegin; 497152f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 497252f91c60SVaclav Hapla 
PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 4973c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 49749566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 49759566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 49769566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 497752f91c60SVaclav Hapla if (isbinary) { 49789566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 497952f91c60SVaclav Hapla } else if (ishdf5) { 498052f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 49819566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 498252f91c60SVaclav Hapla #else 498352f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 498452f91c60SVaclav Hapla #endif 498552f91c60SVaclav Hapla } else { 498698921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 498752f91c60SVaclav Hapla } 49883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 498952f91c60SVaclav Hapla } 499052f91c60SVaclav Hapla 4991d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 4992d71ae5a4SJacob Faibussowitsch { 49933ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 49943ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 4995fbdbba38SShri Abhyankar 4996fbdbba38SShri Abhyankar PetscFunctionBegin; 49979566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 4998bbead8a2SBarry Smith 49993ea6fe3dSLisandro Dalcin /* read in matrix header */ 50009566063dSJacob Faibussowitsch 
PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 500108401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 50029371c9d4SSatish Balay M = header[1]; 50039371c9d4SSatish Balay N = header[2]; 50049371c9d4SSatish Balay nz = header[3]; 500508401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 500608401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 500708401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 5008fbdbba38SShri Abhyankar 50093ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 50109566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 50113ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 50123ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 50133ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 50143ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 50153ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 50169566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 50179566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 50183ea6fe3dSLisandro Dalcin 50193ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 50209566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5021aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 
50223ea6fe3dSLisandro Dalcin 5023fbdbba38SShri Abhyankar /* read in row lengths */ 50249566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 50259566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 50263ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 50279371c9d4SSatish Balay sum = 0; 50289371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 502908401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 50303ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 50319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 50329566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5033aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50343ea6fe3dSLisandro Dalcin /* store row lengths */ 50359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 50369566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5037fbdbba38SShri Abhyankar 50383ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50399371c9d4SSatish Balay a->i[0] = 0; 50409371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 50413ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50429566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 50433ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50449566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5045fbdbba38SShri Abhyankar 50469566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 
50479566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 50483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5049fbdbba38SShri Abhyankar } 5050fbdbba38SShri Abhyankar 5051d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5052d71ae5a4SJacob Faibussowitsch { 50537264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5054fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5055eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5056eeffb40dSHong Zhang PetscInt k; 5057eeffb40dSHong Zhang #endif 50587264ac53SSatish Balay 50593a40ed3dSBarry Smith PetscFunctionBegin; 5060bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5061d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5062ca44d042SBarry Smith *flg = PETSC_FALSE; 50633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5064bcd2baecSBarry Smith } 50657264ac53SSatish Balay 50667264ac53SSatish Balay /* if the a->i are the same */ 50679566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 50683ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 50697264ac53SSatish Balay 50707264ac53SSatish Balay /* if a->j are the same */ 50719566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 50723ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 5073bcd2baecSBarry Smith 50749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5076bcd2baecSBarry Smith /* if a->a are the same */ 5077eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5078eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5079fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 
5080eeffb40dSHong Zhang *flg = PETSC_FALSE; 50813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5082eeffb40dSHong Zhang } 5083eeffb40dSHong Zhang } 5084eeffb40dSHong Zhang #else 50859566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5086eeffb40dSHong Zhang #endif 50879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 50889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 50893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 50907264ac53SSatish Balay } 509136db0b34SBarry Smith 509205869f15SSatish Balay /*@ 509311a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 509436db0b34SBarry Smith provided by the user. 509536db0b34SBarry Smith 5096d083f849SBarry Smith Collective 509736db0b34SBarry Smith 509836db0b34SBarry Smith Input Parameters: 509936db0b34SBarry Smith + comm - must be an MPI communicator of size 1 510036db0b34SBarry Smith . m - number of rows 510136db0b34SBarry Smith . n - number of columns 5102483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 510336db0b34SBarry Smith . j - column indices 510436db0b34SBarry Smith - a - matrix values 510536db0b34SBarry Smith 510636db0b34SBarry Smith Output Parameter: 510736db0b34SBarry Smith . mat - the matrix 510836db0b34SBarry Smith 510936db0b34SBarry Smith Level: intermediate 511036db0b34SBarry Smith 511136db0b34SBarry Smith Notes: 51122ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 5113292fb18eSBarry Smith once the matrix is destroyed and not before 511436db0b34SBarry Smith 511536db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 
511636db0b34SBarry Smith 51172ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 511836db0b34SBarry Smith 5119a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5120a4552177SSatish Balay row-major ordering.. i.e for the following matrix, the input data expected is 51218eef79e4SBarry Smith as shown 51222ef1f0ffSBarry Smith .vb 51232ef1f0ffSBarry Smith 1 0 0 51242ef1f0ffSBarry Smith 2 0 3 51252ef1f0ffSBarry Smith 4 5 6 5126a4552177SSatish Balay 51272ef1f0ffSBarry Smith i = {0,1,3,6} [size = nrow+1 = 3+1] 51282ef1f0ffSBarry Smith j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 51292ef1f0ffSBarry Smith v = {1,2,3,4,5,6} [size = 6] 51302ef1f0ffSBarry Smith .ve 5131a4552177SSatish Balay 51321cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 513336db0b34SBarry Smith @*/ 5134d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5135d71ae5a4SJacob Faibussowitsch { 5136cbcfb4deSHong Zhang PetscInt ii; 513736db0b34SBarry Smith Mat_SeqAIJ *aij; 5138cbcfb4deSHong Zhang PetscInt jj; 513936db0b34SBarry Smith 514036db0b34SBarry Smith PetscFunctionBegin; 5141aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 51429566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 51439566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51449566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51459566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5147ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 51489566063dSJacob Faibussowitsch 
PetscCall(PetscMalloc1(m, &aij->imax)); 51499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5150ab93d7beSBarry Smith 515136db0b34SBarry Smith aij->i = i; 515236db0b34SBarry Smith aij->j = j; 515336db0b34SBarry Smith aij->a = a; 515436db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 515536db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5156e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5157e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 515836db0b34SBarry Smith 5159cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 516036db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 516176bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5162aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 51639985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 516408401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 516508401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 51669985e31cSBarry Smith } 516736db0b34SBarry Smith } 516876bd3646SJed Brown } 516976bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 517036db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 517108401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5172aed4548fSBarry Smith 
PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 517336db0b34SBarry Smith } 517476bd3646SJed Brown } 517536db0b34SBarry Smith 51769566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 51779566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 51783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 517936db0b34SBarry Smith } 5180cbc6b225SStefano Zampini 5181f62e3866SBarry Smith /*@ 518211a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 51838a0b0e6bSVictor Minden provided by the user. 51848a0b0e6bSVictor Minden 5185d083f849SBarry Smith Collective 51868a0b0e6bSVictor Minden 51878a0b0e6bSVictor Minden Input Parameters: 51888a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 51898a0b0e6bSVictor Minden . m - number of rows 51908a0b0e6bSVictor Minden . n - number of columns 51918a0b0e6bSVictor Minden . i - row indices 51928a0b0e6bSVictor Minden . j - column indices 51931230e6d1SVictor Minden . a - matrix values 51941230e6d1SVictor Minden . nz - number of nonzeros 51952ef1f0ffSBarry Smith - idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 51968a0b0e6bSVictor Minden 51978a0b0e6bSVictor Minden Output Parameter: 51988a0b0e6bSVictor Minden . 
mat - the matrix 51998a0b0e6bSVictor Minden 52008a0b0e6bSVictor Minden Level: intermediate 52018a0b0e6bSVictor Minden 5202f62e3866SBarry Smith Example: 5203f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 52049e99939fSJunchao Zhang .vb 52058a0b0e6bSVictor Minden 1 0 0 52068a0b0e6bSVictor Minden 2 0 3 52078a0b0e6bSVictor Minden 4 5 6 52088a0b0e6bSVictor Minden 52098a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 52108a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 52118a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 52129e99939fSJunchao Zhang .ve 52132ef1f0ffSBarry Smith Note: 5214d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5215d7547e51SJunchao Zhang and are particularly useful in iterative applications. 52168a0b0e6bSVictor Minden 52171cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 52188a0b0e6bSVictor Minden @*/ 5219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5220d71ae5a4SJacob Faibussowitsch { 5221d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 52228a0b0e6bSVictor Minden 52238a0b0e6bSVictor Minden PetscFunctionBegin; 52249566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5225ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 52269566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52279566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52289566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 
52301230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 52311230e6d1SVictor Minden if (idx) { 52321230e6d1SVictor Minden row = i[ii] - 1; 52331230e6d1SVictor Minden col = j[ii] - 1; 52341230e6d1SVictor Minden } else { 52351230e6d1SVictor Minden row = i[ii]; 52361230e6d1SVictor Minden col = j[ii]; 52378a0b0e6bSVictor Minden } 52389566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 52398a0b0e6bSVictor Minden } 52409566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52419566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52429566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52448a0b0e6bSVictor Minden } 524536db0b34SBarry Smith 5246d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5247d71ae5a4SJacob Faibussowitsch { 5248acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5249acf2f550SJed Brown 5250acf2f550SJed Brown PetscFunctionBegin; 5251acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5252acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 52532205254eSKarl Rupp 52549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 52553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5256acf2f550SJed Brown } 5257acf2f550SJed Brown 5258d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5259d71ae5a4SJacob Faibussowitsch { 52609c8f2541SHong Zhang PetscFunctionBegin; 52619566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 52623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52639c8f2541SHong Zhang } 52649c8f2541SHong Zhang 526581824310SBarry Smith /* 526653dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 
526753dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 526853dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 526953dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 527053dd7562SDmitry Karpeev */ 5271d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5272d71ae5a4SJacob Faibussowitsch { 527353dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 527453dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 527553dd7562SDmitry Karpeev PetscBool seqaij; 527653dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 527753dd7562SDmitry Karpeev PetscScalar v; 527853dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 527953dd7562SDmitry Karpeev 528053dd7562SDmitry Karpeev PetscFunctionBegin; 52813ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 528253dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 52839566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 528428b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 528553dd7562SDmitry Karpeev if (rowemb) { 52869566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 528708401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 528853dd7562SDmitry Karpeev } else { 528908401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 529053dd7562SDmitry Karpeev } 529153dd7562SDmitry Karpeev if (colemb) { 52929566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 529308401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 529453dd7562SDmitry Karpeev } else { 529508401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 529653dd7562SDmitry Karpeev } 529753dd7562SDmitry Karpeev 529853dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ *)(B->data); 529953dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 53009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5301ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 53029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 53039566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 530453dd7562SDmitry Karpeev } 530548a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 530653dd7562SDmitry Karpeev count = 0; 530753dd7562SDmitry Karpeev rowindices = NULL; 
530853dd7562SDmitry Karpeev colindices = NULL; 530948a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 531048a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 531153dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 531253dd7562SDmitry Karpeev PetscInt row; 531353dd7562SDmitry Karpeev row = i; 531453dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 531553dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 531653dd7562SDmitry Karpeev PetscInt col; 531753dd7562SDmitry Karpeev col = Baij->j[count]; 531853dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 531953dd7562SDmitry Karpeev v = Baij->a[count]; 53209566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 532153dd7562SDmitry Karpeev ++count; 532253dd7562SDmitry Karpeev } 532353dd7562SDmitry Karpeev } 532453dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 532553dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 532653dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 532753dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 532853dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 53293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 533053dd7562SDmitry Karpeev } 533153dd7562SDmitry Karpeev 5332dec0b466SHong Zhang PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A) 5333dec0b466SHong Zhang { 5334dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5335dec0b466SHong Zhang MatScalar *aa = a->a; 5336dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5337dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5338dec0b466SHong Zhang 5339dec0b466SHong Zhang PetscFunctionBegin; 5340dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5341dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5342dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5343dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5344dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 5345dec0b466SHong Zhang if (aa[k] == 0 && aj[k] != i - 1) fshift++; 5346dec0b466SHong Zhang else { 5347dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5348dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5349dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5350dec0b466SHong Zhang } 5351dec0b466SHong Zhang } 5352dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5353dec0b466SHong Zhang fshift_prev = fshift; 5354dec0b466SHong Zhang /* reset ilen and imax for each row */ 5355dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5356dec0b466SHong Zhang a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0); 
5357dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5358dec0b466SHong Zhang } 5359dec0b466SHong Zhang if (m) { 5360dec0b466SHong Zhang ai[m] -= fshift; 5361dec0b466SHong Zhang a->nz = ai[m]; 5362dec0b466SHong Zhang } 5363dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5364dec0b466SHong Zhang A->nonzerostate -= fshift; 5365dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5366dec0b466SHong Zhang a->rmax = rmax; 5367dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5368dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5369dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 53703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5371dec0b466SHong Zhang } 5372dec0b466SHong Zhang 53734099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 53744099cc6bSBarry Smith 53754099cc6bSBarry Smith /*@C 537611a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 53774099cc6bSBarry Smith 5378c3339decSBarry Smith Collective 53794099cc6bSBarry Smith 53804099cc6bSBarry Smith Input Parameters: 53814099cc6bSBarry Smith + mat - the matrix object 53824099cc6bSBarry Smith - matype - matrix type 53834099cc6bSBarry Smith 53844099cc6bSBarry Smith Options Database Key: 53854e187271SRichard Tran Mills . 
-mat_seqaij_type <method> - for example seqaijcrl 53864099cc6bSBarry Smith 53874099cc6bSBarry Smith Level: intermediate 53884099cc6bSBarry Smith 53891cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat` 53904099cc6bSBarry Smith @*/ 5391d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5392d71ae5a4SJacob Faibussowitsch { 53934099cc6bSBarry Smith PetscBool sametype; 53945f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 53954099cc6bSBarry Smith 53964099cc6bSBarry Smith PetscFunctionBegin; 53974099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 53989566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 53993ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 54004099cc6bSBarry Smith 54019566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 54025f80ce2aSJacob Faibussowitsch PetscCheck(r, PETSC_COMM_SELF, PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 54039566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 54043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54054099cc6bSBarry Smith } 54064099cc6bSBarry Smith 54074099cc6bSBarry Smith /*@C 540811a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 54094099cc6bSBarry Smith 54104099cc6bSBarry Smith Not Collective 54114099cc6bSBarry Smith 54124099cc6bSBarry Smith Input Parameters: 541311a5261eSBarry Smith + name - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 54144099cc6bSBarry Smith - function - routine to convert to subtype 54154099cc6bSBarry Smith 54162ef1f0ffSBarry Smith Level: advanced 54172ef1f0ffSBarry Smith 54184099cc6bSBarry Smith Notes: 541911a5261eSBarry Smith `MatSeqAIJRegister()` may be called multiple times to add 
several user-defined solvers. 54204099cc6bSBarry Smith 54214099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 54224099cc6bSBarry Smith $ -mat_seqaij_type my_mat 54234099cc6bSBarry Smith 54241cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()` 54254099cc6bSBarry Smith @*/ 5426d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5427d71ae5a4SJacob Faibussowitsch { 54284099cc6bSBarry Smith PetscFunctionBegin; 54299566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 54309566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 54313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54324099cc6bSBarry Smith } 54334099cc6bSBarry Smith 54344099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 54354099cc6bSBarry Smith 54364099cc6bSBarry Smith /*@C 543711a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 54384099cc6bSBarry Smith 54394099cc6bSBarry Smith Not Collective 54404099cc6bSBarry Smith 54414099cc6bSBarry Smith Level: advanced 54424099cc6bSBarry Smith 54432ef1f0ffSBarry Smith Note: 54442ef1f0ffSBarry Smith This registers the versions of `MATSEQAIJ` for GPUs 54452ef1f0ffSBarry Smith 54461cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()` 54474099cc6bSBarry Smith @*/ 5448d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5449d71ae5a4SJacob Faibussowitsch { 54504099cc6bSBarry Smith PetscFunctionBegin; 54513ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 54524099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 54534099cc6bSBarry Smith 54549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 
54559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 54569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 54579779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 54589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5459485f9817SRichard Tran Mills #endif 54605063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 54619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 54625063d097SStefano Zampini #endif 5463d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5464d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5465d5e393b6SSuyash Tandon #endif 54665063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 54679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 54685063d097SStefano Zampini #endif 54694099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 54709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 54714099cc6bSBarry Smith #endif 54723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54734099cc6bSBarry Smith } 547453dd7562SDmitry Karpeev 547553dd7562SDmitry Karpeev /* 547681824310SBarry Smith Special version for direct calls from Fortran 547781824310SBarry Smith */ 5478af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 547981824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 548081824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 548181824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 548281824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 548381824310SBarry Smith #endif 548481824310SBarry Smith 548581824310SBarry Smith /* Change these 
macros so can be used in void function */
/* Identical to PetscCallVoid, except it assigns to *_ierr */
#undef PetscCall
#define PetscCall(...) \
  do { \
    PetscErrorCode ierr_msv_seqaij = __VA_ARGS__; \
    if (PetscUnlikely(ierr_msv_seqaij)) { \
      *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_seqaij, PETSC_ERROR_REPEAT, " "); \
      return; \
    } \
  } while (0)

/* Same idea for SETERRQ: report the error through *_ierr and leave the void function */
#undef SETERRQ
#define SETERRQ(comm, ierr, ...) \
  do { \
    *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \
    return; \
  } while (0)

/*
  matsetvaluesseqaij_ - Fortran-callable routine that inserts or adds an m-by-n block of values
  directly into the compressed-row storage of a SeqAIJ matrix.

  Input Parameters (all passed by reference, Fortran style):
+ AA   - the matrix
. mm   - number of rows in the block
. im   - row indices; negative entries are skipped
. nn   - number of columns in the block
. in   - column indices; negative entries are skipped
. v    - the values, read as v[l + k*n] when the matrix is row oriented and v[k + l*m] otherwise
- isis - ADD_VALUES adds to an existing entry, any other mode overwrites it

  Output Parameter:
. _ierr - PETSC_SUCCESS on success, otherwise the error code produced by PetscError()

  Notes:
  A row index >= A->rmap->n or a column index >= A->cmap->n is reported as PETSC_ERR_ARG_OUTOFRANGE.

  When the column is not yet present in the row: zero values are dropped if ignorezeroentries is set,
  the value is silently dropped if nonew == 1, an error is raised if nonew == -1, and otherwise the
  entry is inserted in place (growing the storage through MatSeqXAIJReallocateAIJ() if required).

  The search relies on the column indices of each row being stored in ascending order.
*/
PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr)
{
  Mat         A  = *AA;
  PetscInt    m  = *mm, n = *nn;
  InsertMode  is = *isis;
  Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
  PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
  PetscInt   *imax, *ai, *ailen;
  PetscInt   *aj, nonew = a->nonew, lastcol = -1;
  MatScalar  *ap, value, *aa;
  PetscBool   ignorezeroentries = a->ignorezeroentries;
  PetscBool   roworiented       = a->roworiented;

  PetscFunctionBegin;
  /* The error macros above only write *_ierr on failure; give the caller a defined value on success too */
  *_ierr = PETSC_SUCCESS;
  MatCheckPreallocated(A, 1);
  imax  = a->imax;
  ai    = a->i;
  ailen = a->ilen;
  aj    = a->j;
  aa    = a->a;

  for (k = 0; k < m; k++) { /* loop over added rows */
    row = im[k];
    if (row < 0) continue;
    PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large");
    rp   = aj + ai[row]; /* column indices of this row */
    ap   = aa + ai[row]; /* values of this row */
    rmax = imax[row];
    nrow = ailen[row]; /* number of entries currently stored in this row */
    low  = 0;
    high = nrow;
    for (l = 0; l < n; l++) { /* loop over added columns */
      if (in[l] < 0) continue;
      PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large");
      col = in[l];
      if (roworiented) value = v[l + k * n];
      else value = v[k + l * m];

      if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;

      /* Reuse the previous search window when the columns arrive in increasing order */
      if (col <= lastcol) low = 0;
      else high = nrow;
      lastcol = col;
      /* Bisect until the window is small, then finish with a linear scan */
      while (high - low > 5) {
        t = (low + high) / 2;
        if (rp[t] > col) high = t;
        else low = t;
      }
      for (i = low; i < high; i++) {
        if (rp[i] > col) break;
        if (rp[i] == col) {
          if (is == ADD_VALUES) ap[i] += value;
          else ap[i] = value;
          goto noinsert;
        }
      }
      /* Column not present: decide whether a new nonzero may be created at position i */
      if (value == 0.0 && ignorezeroentries) goto noinsert;
      if (nonew == 1) goto noinsert;
      PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix");
      MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
      N = nrow++ - 1;
      a->nz++;
      high++;
      /* shift up all the later entries in this row */
      for (ii = N; ii >= i; ii--) {
        rp[ii + 1] = rp[ii];
        ap[ii + 1] = ap[ii];
      }
      rp[i] = col;
      ap[i] = value;
      A->nonzerostate++;
    noinsert:;
      low = i + 1;
    }
    ailen[row] = nrow;
  }
  PetscFunctionReturnVoid();
}
/* Undefining these here since they were redefined from their original definition above! No
 * other PETSc functions should be defined past this point, as it is impossible to recover the
 * original definitions */
#undef PetscCall
#undef SETERRQ