1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 20d71ae5a4SJacob Faibussowitsch { 214099cc6bSBarry Smith PetscBool flg; 224099cc6bSBarry Smith char type[256]; 234099cc6bSBarry Smith 244099cc6bSBarry Smith PetscFunctionBegin; 25d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 279566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 28d0609cedSBarry Smith PetscOptionsEnd(); 293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 304099cc6bSBarry Smith } 314099cc6bSBarry Smith 32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 33d71ae5a4SJacob Faibussowitsch { 340716a85fSBarry Smith PetscInt i, m, n; 350716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 360716a85fSBarry Smith 370716a85fSBarry Smith PetscFunctionBegin; 389566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 400716a85fSBarry Smith if (type == NORM_2) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 420716a85fSBarry Smith } else if (type == NORM_1) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_INFINITY) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 506adde796SStefano Zampini } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 53a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 54857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 560716a85fSBarry Smith } 573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 580716a85fSBarry Smith } 590716a85fSBarry Smith 60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 61d71ae5a4SJacob Faibussowitsch { 623a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 633a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 
643a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 653a062f41SBarry Smith PetscInt *rows; 663a062f41SBarry Smith 673a062f41SBarry Smith PetscFunctionBegin; 683a062f41SBarry Smith for (i = 0; i < m; i++) { 69ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i = 0; i < m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 799566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 84d71ae5a4SJacob Faibussowitsch { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 86fff043a9SJunchao Zhang const MatScalar *aa; 876ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith 916ce1633cSBarry Smith PetscFunctionBegin; 929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 939566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i = 0; i < m; i++) { 96ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 976ce1633cSBarry Smith } 989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 996ce1633cSBarry Smith cnt = 0; 1006ce1633cSBarry 
Smith for (i = 0; i < m; i++) { 101ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1026ce1633cSBarry Smith } 103f1f41ecbSJed Brown *nrows = cnt; 104f1f41ecbSJed Brown *zrows = rows; 1059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107f1f41ecbSJed Brown } 108f1f41ecbSJed Brown 109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 110d71ae5a4SJacob Faibussowitsch { 111f1f41ecbSJed Brown PetscInt nrows, *rows; 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscFunctionBegin; 1140298fd71SBarry Smith *zrows = NULL; 1159566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1169566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1186ce1633cSBarry Smith } 1196ce1633cSBarry Smith 120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 121d71ae5a4SJacob Faibussowitsch { 122b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 123b3a44c85SBarry Smith const MatScalar *aa; 124b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 125b3a44c85SBarry Smith const PetscInt *ii; 126b3a44c85SBarry Smith PetscInt n, i, j, *rows; 127b3a44c85SBarry Smith 128b3a44c85SBarry Smith PetscFunctionBegin; 1299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 130f4259b30SLisandro Dalcin *keptrows = NULL; 131b3a44c85SBarry Smith ii = a->i; 132b3a44c85SBarry Smith for (i = 0; i < m; i++) { 133b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 134b3a44c85SBarry Smith if (!n) { 135b3a44c85SBarry Smith cnt++; 136b3a44c85SBarry Smith goto ok1; 137b3a44c85SBarry Smith } 1382e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 
139b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 140b3a44c85SBarry Smith } 141b3a44c85SBarry Smith cnt++; 142b3a44c85SBarry Smith ok1:; 143b3a44c85SBarry Smith } 1442e5835c6SStefano Zampini if (!cnt) { 1459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1472e5835c6SStefano Zampini } 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 149b3a44c85SBarry Smith cnt = 0; 150b3a44c85SBarry Smith for (i = 0; i < m; i++) { 151b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 152b3a44c85SBarry Smith if (!n) continue; 1532e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 154b3a44c85SBarry Smith if (aa[j] != 0.0) { 155b3a44c85SBarry Smith rows[cnt++] = i; 156b3a44c85SBarry Smith break; 157b3a44c85SBarry Smith } 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 1609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1619566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith 165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 166d71ae5a4SJacob Faibussowitsch { 16779299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172ace3abfcSBarry Smith PetscBool missing; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 1769566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 17709f38230SBarry Smith if (!missing) { 17879299369SBarry Smith diag = aij->diag; 1799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 
1809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 18179299369SBarry Smith if (is == INSERT_VALUES) { 182ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18379299369SBarry Smith } else { 184ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18579299369SBarry Smith } 1869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18979299369SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 19109f38230SBarry Smith } 1929566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19409f38230SBarry Smith } 19579299369SBarry Smith 196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 197d71ae5a4SJacob Faibussowitsch { 198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19997f1f81fSBarry Smith PetscInt i, ishift; 20017ab2063SBarry Smith 2013a40ed3dSBarry Smith PetscFunctionBegin; 202f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2033ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 204bfeeae90SHong Zhang ishift = 0; 205b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2069566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 207bfeeae90SHong Zhang } else if (oshift == 1) { 2081a83f524SJed Brown PetscInt *tia; 209d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2103b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 
2121a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2131a83f524SJed Brown *ia = tia; 214ecc77c7aSBarry Smith if (ja) { 2151a83f524SJed Brown PetscInt *tja; 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob 
Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch 
PetscCall(PetscFree(*ja)); 2813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; 
row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 
379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, 
PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 4188e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 4198e3a54c0SPierre Jolivet if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]); 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != 
col) goto noinsert; 453c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e44c0bd4SBarry Smith noinsert:; 47217ab2063SBarry Smith } 47317ab2063SBarry Smith ailen[row] = nrow; 47417ab2063SBarry Smith } 4759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47717ab2063SBarry Smith } 47817ab2063SBarry Smith 479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 480d71ae5a4SJacob Faibussowitsch { 48119b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48219b08ed1SBarry Smith PetscInt *rp, k, row; 48319b08ed1SBarry Smith PetscInt *ai = a->i; 48419b08ed1SBarry Smith PetscInt *aj = a->j; 485fff043a9SJunchao Zhang 
MatScalar *aa, *ap; 48619b08ed1SBarry Smith 48719b08ed1SBarry Smith PetscFunctionBegin; 48828b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48908401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 490fff043a9SJunchao Zhang 4919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49219b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49319b08ed1SBarry Smith row = im[k]; 49419b08ed1SBarry Smith rp = aj + ai[row]; 4958e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 49619b08ed1SBarry Smith 4979566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49819b08ed1SBarry Smith if (!A->structure_only) { 49919b08ed1SBarry Smith if (v) { 5009566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 50119b08ed1SBarry Smith v += n; 50219b08ed1SBarry Smith } else { 5039566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50419b08ed1SBarry Smith } 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith a->ilen[row] = n; 50719b08ed1SBarry Smith a->imax[row] = n; 50819b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50919b08ed1SBarry Smith a->nz += n; 51019b08ed1SBarry Smith } 5119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51319b08ed1SBarry Smith } 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith /*@ 51619b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 
51719b08ed1SBarry Smith 51819b08ed1SBarry Smith Input Parameters: 51911a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52119b08ed1SBarry Smith 52219b08ed1SBarry Smith Level: advanced 52319b08ed1SBarry Smith 52419b08ed1SBarry Smith Notes: 52519b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52611a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52719b08ed1SBarry Smith as always with multiple matrix assemblies. 52819b08ed1SBarry Smith 5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53019b08ed1SBarry Smith @*/ 531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 532d71ae5a4SJacob Faibussowitsch { 53319b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53419b08ed1SBarry Smith 53519b08ed1SBarry Smith PetscFunctionBegin; 5369566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53819b08ed1SBarry Smith a->maxnz = nztotal; 5394dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 54019b08ed1SBarry Smith if (!a->ilen) { 5419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54219b08ed1SBarry Smith } else { 5439566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54419b08ed1SBarry Smith } 54519b08ed1SBarry Smith 54619b08ed1SBarry Smith /* allocate the matrix space */ 5479f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(A->rmap->n + 1, sizeof(PetscInt), (void **)&a->i)); 5489f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscInt), (void **)&a->j)); 
5499f0612e4SBarry Smith a->free_ij = PETSC_TRUE; 55019b08ed1SBarry Smith if (A->structure_only) { 55119b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55219b08ed1SBarry Smith } else { 5539f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscScalar), (void **)&a->a)); 55419b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55519b08ed1SBarry Smith } 5569f0612e4SBarry Smith a->i[0] = 0; 55719b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55819b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56019b08ed1SBarry Smith } 56119b08ed1SBarry Smith 562ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 563d71ae5a4SJacob Faibussowitsch { 564071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 565071fcb05SBarry Smith PetscInt *rp, k, row; 566071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 567071fcb05SBarry Smith PetscInt *aj = a->j; 568fff043a9SJunchao Zhang MatScalar *aa, *ap; 569071fcb05SBarry Smith 570071fcb05SBarry Smith PetscFunctionBegin; 5719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 572071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 573071fcb05SBarry Smith row = im[k]; 5746bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 575071fcb05SBarry Smith rp = aj + ai[row]; 576071fcb05SBarry Smith ap = aa + ai[row]; 57748a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 578071fcb05SBarry Smith if (!A->structure_only) { 579071fcb05SBarry Smith if (v) { 5809566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 581071fcb05SBarry Smith v += n; 
582071fcb05SBarry Smith } else { 5839566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 584071fcb05SBarry Smith } 585071fcb05SBarry Smith } 586071fcb05SBarry Smith ailen[row] = n; 587071fcb05SBarry Smith a->nz += n; 588071fcb05SBarry Smith } 5899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 591071fcb05SBarry Smith } 592071fcb05SBarry Smith 593ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 594d71ae5a4SJacob Faibussowitsch { 5957eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59697f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59797f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 5984e208921SJed Brown const MatScalar *ap, *aa; 5997eb43aa7SLois Curfman McInnes 6003a40ed3dSBarry Smith PetscFunctionBegin; 6014e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6027eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6037eb43aa7SLois Curfman McInnes row = im[k]; 6049371c9d4SSatish Balay if (row < 0) { 6059371c9d4SSatish Balay v += n; 6069371c9d4SSatish Balay continue; 6079371c9d4SSatish Balay } /* negative row */ 60854c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6098e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 6108e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 6117eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6127eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6139371c9d4SSatish Balay if (in[l] < 0) { 6149371c9d4SSatish Balay v++; 6159371c9d4SSatish Balay continue; 6169371c9d4SSatish Balay } /* negative column */ 
61754c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 618bfeeae90SHong Zhang col = in[l]; 6199371c9d4SSatish Balay high = nrow; 6209371c9d4SSatish Balay low = 0; /* assume unsorted */ 6217eb43aa7SLois Curfman McInnes while (high - low > 5) { 6227eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6237eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6247eb43aa7SLois Curfman McInnes else low = t; 6257eb43aa7SLois Curfman McInnes } 6267eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6277eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6287eb43aa7SLois Curfman McInnes if (rp[i] == col) { 629b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6307eb43aa7SLois Curfman McInnes goto finished; 6317eb43aa7SLois Curfman McInnes } 6327eb43aa7SLois Curfman McInnes } 63397e567efSBarry Smith *v++ = 0.0; 6347eb43aa7SLois Curfman McInnes finished:; 6357eb43aa7SLois Curfman McInnes } 6367eb43aa7SLois Curfman McInnes } 6374e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6397eb43aa7SLois Curfman McInnes } 6407eb43aa7SLois Curfman McInnes 641ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 642d71ae5a4SJacob Faibussowitsch { 6433ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 644c898d852SStefano Zampini const PetscScalar *av; 6453ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6463ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64717ab2063SBarry Smith 6483a40ed3dSBarry Smith PetscFunctionBegin; 6499566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6502205254eSKarl Rupp 6513ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6523ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6533ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6543ea6fe3dSLisandro Dalcin nz = A->nz; 655416022c9SBarry 
Smith 6563ea6fe3dSLisandro Dalcin /* write matrix header */ 6573ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6589371c9d4SSatish Balay header[1] = M; 6599371c9d4SSatish Balay header[2] = N; 6609371c9d4SSatish Balay header[3] = nz; 6619566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 662416022c9SBarry Smith 6633ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6653ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 666e457bb90SBarry Smith if (PetscDefined(USE_DEBUG)) { 667e457bb90SBarry Smith PetscInt mnz = 0; 668e457bb90SBarry Smith 669e457bb90SBarry Smith for (i = 0; i < m; i++) mnz += rowlens[i]; 670e457bb90SBarry Smith PetscCheck(nz == mnz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row lens %" PetscInt_FMT " do not sum to nz %" PetscInt_FMT, mnz, nz); 671e457bb90SBarry Smith } 6729566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6739566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6743ea6fe3dSLisandro Dalcin /* store column indices */ 6759566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 676416022c9SBarry Smith /* store nonzero values */ 6779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6789566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 680b37d52dbSMark F. 
Adams 6813ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6829566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 68417ab2063SBarry Smith } 685416022c9SBarry Smith 686d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 687d71ae5a4SJacob Faibussowitsch { 6887dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6897dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6907dc0baabSHong Zhang 6917dc0baabSHong Zhang PetscFunctionBegin; 6929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6937dc0baabSHong Zhang for (i = 0; i < m; i++) { 6949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 69548a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6977dc0baabSHong Zhang } 6989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7007dc0baabSHong Zhang } 7017dc0baabSHong Zhang 702ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 703d71ae5a4SJacob Faibussowitsch { 704416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 705c898d852SStefano Zampini const PetscScalar *av; 70660e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 707e060cb09SBarry Smith const char *name; 708f3ef73ceSBarry Smith PetscViewerFormat format; 70917ab2063SBarry Smith 7103a40ed3dSBarry Smith PetscFunctionBegin; 7117dc0baabSHong Zhang if (A->structure_only) { 7129566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 
7147dc0baabSHong Zhang } 71543e49210SHong Zhang 7169566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 717bd6a2ce3SJunchao Zhang // By petsc's rule, even PETSC_VIEWER_ASCII_INFO_DETAIL doesn't print matrix entries 7183ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 7192e5835c6SStefano Zampini 720c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 72371c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 72497f1f81fSBarry Smith PetscInt nofinalvalue = 0; 72560e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 726c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. */ 727d00d2cf4SBarry Smith nofinalvalue = 1; 728d00d2cf4SBarry Smith } 7299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 732fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 734fbfe6fa7SJed Brown #else 7359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 736fbfe6fa7SJed Brown #endif 7379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73817ab2063SBarry Smith 73917ab2063SBarry Smith for (i = 0; i < m; i++) { 74060e0710aSBarry Smith for (j = 
a->i[i]; j < a->i[i + 1]; j++) { 741aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 74317ab2063SBarry Smith #else 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 74517ab2063SBarry Smith #endif 74617ab2063SBarry Smith } 74717ab2063SBarry Smith } 748d00d2cf4SBarry Smith if (nofinalvalue) { 749c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 751c337ccceSJed Brown #else 7529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, A->cmap->n, 0.0)); 753c337ccceSJed Brown #endif 754d00d2cf4SBarry Smith } 7559566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 758fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 76044cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 76260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 763aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76436db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", 
%g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76636db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76836db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7706831982aSBarry Smith } 77144cd7ae7SLois Curfman McInnes #else 7729566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 77344cd7ae7SLois Curfman McInnes #endif 77444cd7ae7SLois Curfman McInnes } 7759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77644cd7ae7SLois Curfman McInnes } 7779566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 778fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 77997f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 782496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 783496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 78460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 785496be53dSLois Curfman McInnes if (a->j[j] >= i) { 786aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78736db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 788496be53dSLois Curfman McInnes #else 789496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 790496be53dSLois Curfman McInnes #endif 791496be53dSLois Curfman McInnes } 792496be53dSLois Curfman McInnes } 
793496be53dSLois Curfman McInnes } 7942e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7962e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7972205254eSKarl Rupp if (i + 4 < m) { 7989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 7992205254eSKarl Rupp } else if (i + 3 < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 8012205254eSKarl Rupp } else if (i + 2 < m) { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 8032205254eSKarl Rupp } else if (i + 1 < m) { 8049566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 8052205254eSKarl Rupp } else if (i < m) { 8069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8072205254eSKarl Rupp } else { 8089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8092205254eSKarl Rupp } 810496be53dSLois Curfman McInnes } 8119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8129566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 813496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8159566063dSJacob 
Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 816496be53dSLois Curfman McInnes } 8179566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 818496be53dSLois Curfman McInnes } 8199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 820496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 82160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 822496be53dSLois Curfman McInnes if (a->j[j] >= i) { 823aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 82448a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 825496be53dSLois Curfman McInnes #else 8269566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 827496be53dSLois Curfman McInnes #endif 828496be53dSLois Curfman McInnes } 829496be53dSLois Curfman McInnes } 8309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 831496be53dSLois Curfman McInnes } 8329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 833fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 83497f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 83587828ca2SBarry Smith PetscScalar value; 83668f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83768f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83868f1ed48SBarry Smith 83968f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 84068f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 84168f1ed48SBarry Smith realonly = PETSC_FALSE; 84268f1ed48SBarry Smith break; 84368f1ed48SBarry Smith } 84468f1ed48SBarry Smith } 84568f1ed48SBarry Smith #endif 84602594712SBarry Smith 8479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 
84802594712SBarry Smith for (i = 0; i < m; i++) { 84902594712SBarry Smith jcnt = 0; 850d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 851e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 85202594712SBarry Smith value = a->a[cnt++]; 853e24b481bSBarry Smith jcnt++; 85402594712SBarry Smith } else { 85502594712SBarry Smith value = 0.0; 85602594712SBarry Smith } 857aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85868f1ed48SBarry Smith if (realonly) { 8599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 86068f1ed48SBarry Smith } else { 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 86268f1ed48SBarry Smith } 86302594712SBarry Smith #else 8649566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 86502594712SBarry Smith #endif 86602594712SBarry Smith } 8679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86802594712SBarry Smith } 8699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8703c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 871150b93efSMatthew G. 
Knepley PetscInt fshift = 1; 8729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8733c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8753c215bfdSMatthew Knepley #else 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8773c215bfdSMatthew Knepley #endif 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8793c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 88060e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8813c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8833c215bfdSMatthew Knepley #else 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8853c215bfdSMatthew Knepley #endif 8863c215bfdSMatthew Knepley } 8873c215bfdSMatthew Knepley } 8889566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8893a40ed3dSBarry Smith } else { 8909566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 891d5f3da31SBarry Smith if (A->factortype) { 89216cd7e1dSShri Abhyankar for (i = 0; i < m; i++) { 8939566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 89416cd7e1dSShri Abhyankar /* L part */ 89560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89716cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) 
> 0.0) { 8989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 89916cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 90116cd7e1dSShri Abhyankar } else { 9029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 90316cd7e1dSShri Abhyankar } 90416cd7e1dSShri Abhyankar #else 9059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90616cd7e1dSShri Abhyankar #endif 90716cd7e1dSShri Abhyankar } 90816cd7e1dSShri Abhyankar /* diagonal */ 90916cd7e1dSShri Abhyankar j = a->diag[i]; 91016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 912835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)PetscImaginaryPart(1 / a->a[j]))); 91316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 914835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)(-PetscImaginaryPart(1 / a->a[j])))); 91516cd7e1dSShri Abhyankar } else { 916835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1 / a->a[j]))); 91716cd7e1dSShri Abhyankar } 91816cd7e1dSShri Abhyankar #else 919835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1 / a->a[j]))); 92016cd7e1dSShri Abhyankar #endif 
92116cd7e1dSShri Abhyankar 92216cd7e1dSShri Abhyankar /* U part */ 92360e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 92416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 92516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9289566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 92916cd7e1dSShri Abhyankar } else { 9309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 93116cd7e1dSShri Abhyankar } 93216cd7e1dSShri Abhyankar #else 9339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 93416cd7e1dSShri Abhyankar #endif 93516cd7e1dSShri Abhyankar } 9369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93716cd7e1dSShri Abhyankar } 93816cd7e1dSShri Abhyankar } else { 93917ab2063SBarry Smith for (i = 0; i < m; i++) { 9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 94160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 942aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 94336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 9449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94536db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" 
PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9473a40ed3dSBarry Smith } else { 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 94917ab2063SBarry Smith } 95017ab2063SBarry Smith #else 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 95217ab2063SBarry Smith #endif 95317ab2063SBarry Smith } 9549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95517ab2063SBarry Smith } 95616cd7e1dSShri Abhyankar } 9579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95817ab2063SBarry Smith } 9599566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 961416022c9SBarry Smith } 962416022c9SBarry Smith 9639804daf3SBarry Smith #include <petscdraw.h> 964ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 965d71ae5a4SJacob Faibussowitsch { 966480ef9eaSBarry Smith Mat A = (Mat)Aa; 967416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 968383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 969383922c3SLisandro Dalcin int color; 970b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 971b0a32e0cSBarry Smith PetscViewer viewer; 972f3ef73ceSBarry Smith PetscViewerFormat format; 973fff043a9SJunchao Zhang const PetscScalar *aa; 974cddf8d76SBarry Smith 9753a40ed3dSBarry Smith PetscFunctionBegin; 9769566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9779566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9789566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 979383922c3SLisandro Dalcin 980416022c9SBarry Smith /* 
loop over matrix elements drawing boxes */ 9819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 982fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 983d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9840513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 985b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 986416022c9SBarry Smith for (i = 0; i < m; i++) { 9879371c9d4SSatish Balay y_l = m - i - 1.0; 9889371c9d4SSatish Balay y_r = y_l + 1.0; 989bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9909371c9d4SSatish Balay x_l = a->j[j]; 9919371c9d4SSatish Balay x_r = x_l + 1.0; 992fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9939566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 994cddf8d76SBarry Smith } 995cddf8d76SBarry Smith } 996b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 997cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9989371c9d4SSatish Balay y_l = m - i - 1.0; 9999371c9d4SSatish Balay y_r = y_l + 1.0; 1000bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10019371c9d4SSatish Balay x_l = a->j[j]; 10029371c9d4SSatish Balay x_r = x_l + 1.0; 1003fff043a9SJunchao Zhang if (aa[j] != 0.) continue; 10049566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1005cddf8d76SBarry Smith } 1006cddf8d76SBarry Smith } 1007b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1008cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10099371c9d4SSatish Balay y_l = m - i - 1.0; 10109371c9d4SSatish Balay y_r = y_l + 1.0; 1011bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10129371c9d4SSatish Balay x_l = a->j[j]; 10139371c9d4SSatish Balay x_r = x_l + 1.0; 1014fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) 
continue; 10159566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1016416022c9SBarry Smith } 1017416022c9SBarry Smith } 1018d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10190513a670SBarry Smith } else { 10200513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10210513a670SBarry Smith /* first determine max of all nonzero values */ 1022b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1023383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1024b0a32e0cSBarry Smith PetscDraw popup; 10250513a670SBarry Smith 10260513a670SBarry Smith for (i = 0; i < nz; i++) { 1027fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10280513a670SBarry Smith } 1029383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10309566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10319566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1032383922c3SLisandro Dalcin 1033d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10340513a670SBarry Smith for (i = 0; i < m; i++) { 1035383922c3SLisandro Dalcin y_l = m - i - 1.0; 1036383922c3SLisandro Dalcin y_r = y_l + 1.0; 1037bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1038383922c3SLisandro Dalcin x_l = a->j[j]; 1039383922c3SLisandro Dalcin x_r = x_l + 1.0; 1040fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10419566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10420513a670SBarry Smith count++; 10430513a670SBarry Smith } 10440513a670SBarry Smith } 1045d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10460513a670SBarry Smith } 10479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1049480ef9eaSBarry Smith } 1050cddf8d76SBarry Smith 
10519804daf3SBarry Smith #include <petscdraw.h> 1052ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1053d71ae5a4SJacob Faibussowitsch { 1054b0a32e0cSBarry Smith PetscDraw draw; 105536db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1056ace3abfcSBarry Smith PetscBool isnull; 1057480ef9eaSBarry Smith 1058480ef9eaSBarry Smith PetscFunctionBegin; 10599566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10609566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10613ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1062480ef9eaSBarry Smith 10639371c9d4SSatish Balay xr = A->cmap->n; 10649371c9d4SSatish Balay yr = A->rmap->n; 10659371c9d4SSatish Balay h = yr / 10.0; 10669371c9d4SSatish Balay w = xr / 10.0; 10679371c9d4SSatish Balay xr += w; 10689371c9d4SSatish Balay yr += h; 10699371c9d4SSatish Balay xl = -w; 10709371c9d4SSatish Balay yl = -h; 10719566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10729566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10739566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10749566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10759566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 10763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1077416022c9SBarry Smith } 1078416022c9SBarry Smith 1079d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1080d71ae5a4SJacob Faibussowitsch { 1081ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1082416022c9SBarry Smith 10833a40ed3dSBarry Smith PetscFunctionBegin; 10849566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10859566063dSJacob Faibussowitsch 
PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10869566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10871baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10881baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10891baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10909566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109217ab2063SBarry Smith } 109319bcc07fSBarry Smith 1094d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1095d71ae5a4SJacob Faibussowitsch { 1096416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1097580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1098bc43efbbSJunchao Zhang PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n; 109954f21887SBarry Smith MatScalar *aa = a->a, *ap; 11003447b6efSHong Zhang PetscReal ratio = 0.6; 110117ab2063SBarry Smith 11023a40ed3dSBarry Smith PetscFunctionBegin; 11033ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 11049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1105b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1106b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11079566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1109b215bc84SStefano Zampini } 111017ab2063SBarry Smith 111143ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 111217ab2063SBarry Smith for (i = 1; i < m; i++) { 1113416022c9SBarry Smith /* move each row 
back by the amount of empty slots (fshift) before it*/ 111417ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111594a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111617ab2063SBarry Smith if (fshift) { 1117bfeeae90SHong Zhang ip = aj + ai[i]; 1118bfeeae90SHong Zhang ap = aa + ai[i]; 111917ab2063SBarry Smith N = ailen[i]; 11209566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 112148a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 112217ab2063SBarry Smith } 112317ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112417ab2063SBarry Smith } 112517ab2063SBarry Smith if (m) { 112617ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112717ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112817ab2063SBarry Smith } 112917ab2063SBarry Smith /* reset ilen and imax for each row */ 11307b083b7cSBarry Smith a->nonzerorowcnt = 0; 1131396832f4SHong Zhang if (A->structure_only) { 11329566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11339566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1134396832f4SHong Zhang } else { /* !A->structure_only */ 113517ab2063SBarry Smith for (i = 0; i < m; i++) { 113617ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11377b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113817ab2063SBarry Smith } 1139396832f4SHong Zhang } 1140bfeeae90SHong Zhang a->nz = ai[m]; 1141aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 1142bc43efbbSJunchao Zhang PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly 1143bc43efbbSJunchao Zhang a->diagonaldense = PETSC_TRUE; 1144bc43efbbSJunchao Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1145bc43efbbSJunchao Zhang for (i = 0; i < n; i++) { 
1146bc43efbbSJunchao Zhang if (a->diag[i] >= ai[i + 1]) { 1147bc43efbbSJunchao Zhang a->diagonaldense = PETSC_FALSE; 1148bc43efbbSJunchao Zhang break; 1149bc43efbbSJunchao Zhang } 1150bc43efbbSJunchao Zhang } 11519566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11529566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11539566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11542205254eSKarl Rupp 11558e58a170SBarry Smith A->info.mallocs += a->reallocs; 1156dd5f02e7SSatish Balay a->reallocs = 0; 11576712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 115836db0b34SBarry Smith a->rmax = rmax; 11594e220ebcSLois Curfman McInnes 116048a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11619566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 116317ab2063SBarry Smith } 116417ab2063SBarry Smith 1165ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1166d71ae5a4SJacob Faibussowitsch { 116799cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116899cafbc1SBarry Smith PetscInt i, nz = a->nz; 11692e5835c6SStefano Zampini MatScalar *aa; 117099cafbc1SBarry Smith 117199cafbc1SBarry Smith PetscFunctionBegin; 11729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117399cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11763ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 117799cafbc1SBarry Smith } 117899cafbc1SBarry Smith 1179ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1180d71ae5a4SJacob Faibussowitsch { 118199cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 118299cafbc1SBarry Smith PetscInt i, nz = a->nz; 11832e5835c6SStefano Zampini MatScalar *aa; 118499cafbc1SBarry Smith 118599cafbc1SBarry Smith PetscFunctionBegin; 11869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 118799cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119199cafbc1SBarry Smith } 119299cafbc1SBarry Smith 1193d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1194d71ae5a4SJacob Faibussowitsch { 1195fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1196fff043a9SJunchao Zhang MatScalar *aa; 11973a40ed3dSBarry Smith 11983a40ed3dSBarry Smith PetscFunctionBegin; 11999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 12009566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 12019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 12029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 12033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120417ab2063SBarry Smith } 1205416022c9SBarry Smith 1206674b392bSAlexander static PetscErrorCode MatReset_SeqAIJ(Mat A) 1207d71ae5a4SJacob Faibussowitsch { 1208416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1209d5d45c9bSBarry Smith 12103a40ed3dSBarry Smith PetscFunctionBegin; 1211b4e2f619SBarry Smith if (A->hash_active) { 1212e3c72094SPierre Jolivet A->ops[0] = a->cops; 1213b4e2f619SBarry Smith 
PetscCall(PetscHMapIJVDestroy(&a->ht)); 1214b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 1215b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 1216b4e2f619SBarry Smith } 1217b4e2f619SBarry Smith 12183ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 12199566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12209566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12219566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12229566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12289566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12299566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12309566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12319566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12329566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 1233674b392bSAlexander PetscFunctionReturn(PETSC_SUCCESS); 1234674b392bSAlexander } 1235674b392bSAlexander 1236674b392bSAlexander static PetscErrorCode MatResetHash_SeqAIJ(Mat A) 1237674b392bSAlexander { 1238674b392bSAlexander PetscFunctionBegin; 1239674b392bSAlexander PetscCall(MatReset_SeqAIJ(A)); 1240674b392bSAlexander PetscCall(MatCreate_SeqAIJ_Inode(A)); 1241674b392bSAlexander PetscCall(MatSetUp_Seq_Hash(A)); 1242674b392bSAlexander A->nonzerostate++; 1243674b392bSAlexander PetscFunctionReturn(PETSC_SUCCESS); 1244674b392bSAlexander } 1245674b392bSAlexander 1246674b392bSAlexander 
PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1247674b392bSAlexander { 1248674b392bSAlexander PetscFunctionBegin; 1249674b392bSAlexander PetscCall(MatReset_SeqAIJ(A)); 12509566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1251901853e0SKris Buschelman 12526718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12536718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12546718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12556718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12566718818eSStefano Zampini due to different matrix sizes */ 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12586718818eSStefano Zampini 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12602e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12612e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12682e956fe4SStefano 
Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12692e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12702e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12712e956fe4SStefano Zampini #endif 12724222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12764222ddf1SHong Zhang #endif 1277d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1278d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1279d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1280d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1281d5e393b6SSuyash Tandon #endif 12823d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12843d0639e7SStefano Zampini #endif 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1286af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1288af8000cdSHong Zhang #endif 1289d24d4204SJose E. 
Roman #if defined(PETSC_HAVE_SCALAPACK) 12909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1291d24d4204SJose E. Roman #endif 129263c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 129563c07aadSStefano Zampini #endif 12969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 13002e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 13019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 13029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 1303674b392bSAlexander PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetHash_C", NULL)); 13049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 13059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 13069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 13079566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 13089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 13099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL)); 13109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 13119566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 13122e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 13132e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 13142e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 13152e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 13162e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 13172e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 13182e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 13193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 132017ab2063SBarry Smith } 132117ab2063SBarry Smith 1322d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1323d71ae5a4SJacob Faibussowitsch { 1324416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13253a40ed3dSBarry Smith 13263a40ed3dSBarry Smith PetscFunctionBegin; 1327a65d3064SKris Buschelman switch (op) { 1328d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 
1329d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1330d71ae5a4SJacob Faibussowitsch break; 1331d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1332d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1333d71ae5a4SJacob Faibussowitsch break; 1334d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1335d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1336d71ae5a4SJacob Faibussowitsch break; 1337d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1338d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1339d71ae5a4SJacob Faibussowitsch break; 1340d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1341d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1342d71ae5a4SJacob Faibussowitsch break; 1343d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1344d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1345d71ae5a4SJacob Faibussowitsch break; 1346d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1347d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1348d71ae5a4SJacob Faibussowitsch break; 1349d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1350d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1351d71ae5a4SJacob Faibussowitsch break; 1352d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1353d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1354d71ae5a4SJacob Faibussowitsch break; 1355071fcb05SBarry Smith case MAT_SORTED_FULL: 1356071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1357071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1358071fcb05SBarry Smith break; 1359d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1360d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1361d71ae5a4SJacob Faibussowitsch break; 1362d71ae5a4SJacob Faibussowitsch default: 1363888c827cSStefano Zampini break; 1364a65d3064SKris Buschelman } 
13653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 136617ab2063SBarry Smith } 136717ab2063SBarry Smith 1368ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1369d71ae5a4SJacob Faibussowitsch { 1370416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1371fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1372c898d852SStefano Zampini PetscScalar *x; 1373c898d852SStefano Zampini const PetscScalar *aa; 137417ab2063SBarry Smith 13753a40ed3dSBarry Smith PetscFunctionBegin; 13769566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 137708401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1379d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1380d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13819566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13822c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13839566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 138635e7444dSHong Zhang } 138735e7444dSHong Zhang 13889566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 138935e7444dSHong Zhang for (i = 0; i < n; i++) { 1390fdc842d1SBarry Smith x[i] = 0.0; 139135e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 139235e7444dSHong Zhang if (aj[j] == i) { 139335e7444dSHong Zhang x[i] = aa[j]; 139417ab2063SBarry Smith break; 139517ab2063SBarry Smith } 139617ab2063SBarry Smith } 139717ab2063SBarry Smith } 13989566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14003ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 140117ab2063SBarry Smith } 140217ab2063SBarry Smith 1403c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1404d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1405d71ae5a4SJacob Faibussowitsch { 1406416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 14075f22a7b3SSebastian Grimberg const MatScalar *aa; 1408d9ca1df4SBarry Smith PetscScalar *y; 1409d9ca1df4SBarry Smith const PetscScalar *x; 1410d0f46423SBarry Smith PetscInt m = A->rmap->n; 14115c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14125f22a7b3SSebastian Grimberg const MatScalar *v; 1413a77337e4SBarry Smith PetscScalar alpha; 1414d9ca1df4SBarry Smith PetscInt n, i, j; 1415d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14163447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1417ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14185c897100SBarry Smith #endif 141917ab2063SBarry Smith 14203a40ed3dSBarry Smith PetscFunctionBegin; 14219566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14229566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14239566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14255c897100SBarry Smith 14265c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1427fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14285c897100SBarry Smith #else 14293447b6efSHong Zhang if (usecprow) { 14303447b6efSHong Zhang m = cprow.nrows; 14313447b6efSHong Zhang ii = cprow.i; 14327b2bb3b9SHong Zhang ridx = cprow.rindex; 14333447b6efSHong Zhang } else { 14343447b6efSHong Zhang ii = a->i; 14353447b6efSHong Zhang } 143617ab2063SBarry Smith for (i = 0; i < m; i++) { 14373447b6efSHong Zhang idx = a->j + ii[i]; 1438fff043a9SJunchao Zhang v = aa + ii[i]; 14393447b6efSHong 
Zhang n = ii[i + 1] - ii[i]; 14403447b6efSHong Zhang if (usecprow) { 14417b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14423447b6efSHong Zhang } else { 144317ab2063SBarry Smith alpha = x[i]; 14443447b6efSHong Zhang } 144504fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 144617ab2063SBarry Smith } 14475c897100SBarry Smith #endif 14489566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14499566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14509566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 145317ab2063SBarry Smith } 145417ab2063SBarry Smith 1455d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1456d71ae5a4SJacob Faibussowitsch { 14575c897100SBarry Smith PetscFunctionBegin; 14589566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14599566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14615c897100SBarry Smith } 14625c897100SBarry Smith 1463c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 146478b84d54SShri Abhyankar 1465d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1466d71ae5a4SJacob Faibussowitsch { 1467416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1468d9fead3dSBarry Smith PetscScalar *y; 146954f21887SBarry Smith const PetscScalar *x; 14705914357eSBarry Smith const MatScalar *a_a; 1471003131ecSBarry Smith PetscInt m = A->rmap->n; 14725914357eSBarry Smith const PetscInt *ii, *ridx = NULL; 1473ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 147417ab2063SBarry Smith 1475b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 147697952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1477fee21e36SBarry Smith #endif 
1478fee21e36SBarry Smith 14793a40ed3dSBarry Smith PetscFunctionBegin; 1480b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14819566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1483b215bc84SStefano Zampini } 14849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14859566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14869566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1487416022c9SBarry Smith ii = a->i; 14884eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14899566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 149097952fefSHong Zhang m = a->compressedrow.nrows; 149197952fefSHong Zhang ii = a->compressedrow.i; 149297952fefSHong Zhang ridx = a->compressedrow.rindex; 14935914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 14945914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 14955914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 14965914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 14975914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 14985914357eSBarry Smith PetscScalar sum = 0.0; 1499003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1500003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1501c9a1b032SJunchao Zhang y[ridx[i]] = sum; 150297952fefSHong Zhang } 150397952fefSHong Zhang } else { /* do not use compressed row format */ 1504b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15055914357eSBarry Smith fortranmultaij_(&m, x, ii, a->j, a_a, y); 1506b05257ddSBarry Smith #else 15075914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 15085914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 15095914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 15105914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 15115914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 15125914357eSBarry Smith 
PetscScalar sum = 0.0; 1513003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 151417ab2063SBarry Smith y[i] = sum; 151517ab2063SBarry Smith } 15168d195f9aSBarry Smith #endif 1517b05257ddSBarry Smith } 15189566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15209566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 152317ab2063SBarry Smith } 152417ab2063SBarry Smith 1525ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1526ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1527d71ae5a4SJacob Faibussowitsch { 1528b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1529b434eb95SMatthew G. Knepley PetscScalar *y; 1530b434eb95SMatthew G. Knepley const PetscScalar *x; 1531fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1532b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1533b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1534b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1535b434eb95SMatthew G. Knepley PetscScalar sum; 1536b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1537b434eb95SMatthew G. Knepley 1538b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1539b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1540b434eb95SMatthew G. Knepley #endif 1541b434eb95SMatthew G. Knepley 1542b434eb95SMatthew G. Knepley PetscFunctionBegin; 15439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15449566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15459566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1546b434eb95SMatthew G. 
Knepley if (usecprow) { /* use compressed row format */ 1547b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1548b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1549b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1550b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1551b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1552b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1553fff043a9SJunchao Zhang aa = a_a + ii[i]; 1554b434eb95SMatthew G. Knepley sum = 0.0; 1555b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1556b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1557b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1558b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1559b434eb95SMatthew G. Knepley } 1560b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15613d3eaba7SBarry Smith ii = a->i; 1562b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1563b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1564b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1565fff043a9SJunchao Zhang aa = a_a + ii[i]; 1566b434eb95SMatthew G. Knepley sum = 0.0; 1567b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1568b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1569b434eb95SMatthew G. Knepley y[i] = sum; 1570b434eb95SMatthew G. Knepley } 1571b434eb95SMatthew G. Knepley } 15729566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15739566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15749566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1577b434eb95SMatthew G. Knepley } 1578b434eb95SMatthew G. Knepley 1579ba38deedSJacob Faibussowitsch // HACK!!!!! 
Used by src/mat/tests/ex170.c 1580ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1581d71ae5a4SJacob Faibussowitsch { 1582b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1583b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1584b434eb95SMatthew G. Knepley const PetscScalar *x; 1585fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1586b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1587b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1588b434eb95SMatthew G. Knepley PetscScalar sum; 1589b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1590b434eb95SMatthew G. Knepley 1591b434eb95SMatthew G. Knepley PetscFunctionBegin; 15929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15939566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15949566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1595b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 159648a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1597b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1598b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1599b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1600b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1601b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1602b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1603fff043a9SJunchao Zhang aa = a_a + ii[i]; 1604b434eb95SMatthew G. Knepley sum = y[*ridx]; 1605b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1606b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1607b434eb95SMatthew G. Knepley } 1608b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16093d3eaba7SBarry Smith ii = a->i; 1610b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1611b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1612b434eb95SMatthew G. 
Knepley aj = a->j + ii[i]; 1613fff043a9SJunchao Zhang aa = a_a + ii[i]; 1614b434eb95SMatthew G. Knepley sum = y[i]; 1615b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1616b434eb95SMatthew G. Knepley z[i] = sum; 1617b434eb95SMatthew G. Knepley } 1618b434eb95SMatthew G. Knepley } 16199566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16209566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16219566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1624b434eb95SMatthew G. Knepley } 1625b434eb95SMatthew G. Knepley 1626c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1627d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1628d71ae5a4SJacob Faibussowitsch { 1629416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1630f15663dcSBarry Smith PetscScalar *y, *z; 1631f15663dcSBarry Smith const PetscScalar *x; 16325914357eSBarry Smith const MatScalar *a_a; 16335914357eSBarry Smith const PetscInt *ii, *ridx = NULL; 16345914357eSBarry Smith PetscInt m = A->rmap->n; 1635ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16369ea0dfa2SSatish Balay 16373a40ed3dSBarry Smith PetscFunctionBegin; 1638b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16399566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1641b215bc84SStefano Zampini } 16429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16439566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16449566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16454eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 164648a46eb9SPierre Jolivet if 
(zz != yy) PetscCall(PetscArraycpy(z, y, m)); 164797952fefSHong Zhang m = a->compressedrow.nrows; 164897952fefSHong Zhang ii = a->compressedrow.i; 164997952fefSHong Zhang ridx = a->compressedrow.rindex; 16505914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 16515914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 16525914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 16535914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 16545914357eSBarry Smith PetscScalar sum = y[*ridx]; 1655f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165697952fefSHong Zhang z[*ridx++] = sum; 165797952fefSHong Zhang } 165897952fefSHong Zhang } else { /* do not use compressed row format */ 16593d3eaba7SBarry Smith ii = a->i; 1660f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16615914357eSBarry Smith fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z); 1662f15663dcSBarry Smith #else 16635914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 16645914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 16655914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 16665914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 16675914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 16685914357eSBarry Smith PetscScalar sum = y[i]; 1669f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 167017ab2063SBarry Smith z[i] = sum; 167117ab2063SBarry Smith } 167202ab625aSSatish Balay #endif 1673f15663dcSBarry Smith } 16749566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16759566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16769566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 167917ab2063SBarry Smith } 168017ab2063SBarry Smith 168117ab2063SBarry Smith /* 16820b4b7b1cSBarry Smith Adds diagonal pointers to sparse matrix nonzero 
structure. 168317ab2063SBarry Smith */ 1684d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1685d71ae5a4SJacob Faibussowitsch { 1686416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1687d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1688c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 168917ab2063SBarry Smith 16903a40ed3dSBarry Smith PetscFunctionBegin; 169109f38230SBarry Smith if (!a->diag) { 16929566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1693c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 169409f38230SBarry Smith } 1695d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1696c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1697c0c07093SJunchao Zhang if (alreadySet) { 1698c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1699c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1700c0c07093SJunchao Zhang } 1701c0c07093SJunchao Zhang 170209f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1703bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1704bfeeae90SHong Zhang if (a->j[j] == i) { 170509f38230SBarry Smith a->diag[i] = j; 170617ab2063SBarry Smith break; 170717ab2063SBarry Smith } 170817ab2063SBarry Smith } 170917ab2063SBarry Smith } 17103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 171117ab2063SBarry Smith } 171217ab2063SBarry Smith 1713ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1714d71ae5a4SJacob Faibussowitsch { 171561ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 171661ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 171761ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 171861ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 171961ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 172061ecd0c6SBarry Smith 
172161ecd0c6SBarry Smith PetscFunctionBegin; 172261ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17249566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 17253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 172661ecd0c6SBarry Smith } 172761ecd0c6SBarry Smith 172861ecd0c6SBarry Smith if (a->diagonaldense) { 172961ecd0c6SBarry Smith cnt = 0; 173061ecd0c6SBarry Smith } else { 17319566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 173261ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1733349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 173461ecd0c6SBarry Smith cnt++; 173561ecd0c6SBarry Smith mdiag[i] = 1; 173661ecd0c6SBarry Smith } 173761ecd0c6SBarry Smith } 173861ecd0c6SBarry Smith } 173961ecd0c6SBarry Smith if (!cnt) { 17409566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 174161ecd0c6SBarry Smith } else { 1742b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1743b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 17449f0612e4SBarry Smith PetscBool free_a = a->free_a, free_ij = a->free_ij; 17456ea2a7edSJunchao Zhang const PetscScalar *Aa; 17466ea2a7edSJunchao Zhang 17476ea2a7edSJunchao Zhang PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host 17486ea2a7edSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa)); 174961ecd0c6SBarry Smith 175061ecd0c6SBarry Smith a->a = NULL; 175161ecd0c6SBarry Smith a->j = NULL; 175261ecd0c6SBarry Smith a->i = NULL; 175361ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1754ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17559566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 175661ecd0c6SBarry Smith 175761ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 175861ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17599566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 176048a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1761447d62f5SStefano Zampini } 17629566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17639566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 17649f0612e4SBarry Smith if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda)); 17659f0612e4SBarry Smith if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj)); 17669f0612e4SBarry Smith if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi)); 176761ecd0c6SBarry Smith } 17689566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 176961ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 17703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 177161ecd0c6SBarry Smith } 177261ecd0c6SBarry Smith 1773be5855fcSBarry Smith /* 1774be5855fcSBarry Smith Checks for missing diagonals 1775be5855fcSBarry Smith */ 1776d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1777d71ae5a4SJacob Faibussowitsch { 1778be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17797734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1780be5855fcSBarry Smith 1781be5855fcSBarry Smith PetscFunctionBegin; 178209f38230SBarry Smith *missing = PETSC_FALSE; 17837734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 178409f38230SBarry Smith *missing = PETSC_TRUE; 178509f38230SBarry Smith if (d) *d = 0; 17869566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 178709f38230SBarry Smith } else { 178801445905SHong Zhang PetscInt n; 178901445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1790f1e2ffcdSBarry Smith diag = a->diag; 179101445905SHong Zhang for (i = 0; i < n; i++) { 17927734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 179309f38230SBarry Smith *missing = PETSC_TRUE; 179409f38230SBarry Smith if (d) *d = i; 17959566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1796358d2f5dSShri Abhyankar break; 179709f38230SBarry Smith } 1798be5855fcSBarry Smith } 1799be5855fcSBarry Smith } 18003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1801be5855fcSBarry Smith } 1802be5855fcSBarry Smith 18030da83c2eSBarry Smith #include <petscblaslapack.h> 18040da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18050da83c2eSBarry Smith 18060da83c2eSBarry Smith /* 18070da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18080da83c2eSBarry Smith */ 1809ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1810d71ae5a4SJacob Faibussowitsch { 18110da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18120da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18130da83c2eSBarry Smith const PetscReal shift = 0.0; 18140da83c2eSBarry Smith PetscInt ipvt[5]; 18154e208921SJed Brown PetscCount flops = 0; 18160da83c2eSBarry Smith PetscScalar work[25], *v_work; 18170da83c2eSBarry Smith 18180da83c2eSBarry Smith PetscFunctionBegin; 18190da83c2eSBarry Smith allowzeropivot = 
PetscNot(A->erroriffailure); 18200da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 182108401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1822ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 182448a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18250da83c2eSBarry Smith ncnt = 0; 18260da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18270da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18289566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18290da83c2eSBarry Smith switch (bsizes[i]) { 1830d71ae5a4SJacob Faibussowitsch case 1: 1831d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1832d71ae5a4SJacob Faibussowitsch break; 18330da83c2eSBarry Smith case 2: 18349566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18350da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18369566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18370da83c2eSBarry Smith break; 18380da83c2eSBarry Smith case 3: 18399566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18400da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18420da83c2eSBarry Smith break; 18430da83c2eSBarry Smith case 4: 18449566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18450da83c2eSBarry Smith if (zeropivotdetected) 
A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18470da83c2eSBarry Smith break; 18480da83c2eSBarry Smith case 5: 18499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18500da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18520da83c2eSBarry Smith break; 18530da83c2eSBarry Smith case 6: 18549566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18550da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18569566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18570da83c2eSBarry Smith break; 18580da83c2eSBarry Smith case 7: 18599566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18600da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18619566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18620da83c2eSBarry Smith break; 18630da83c2eSBarry Smith default: 18649566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18650da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18669566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18670da83c2eSBarry Smith } 18680da83c2eSBarry Smith ncnt += bsizes[i]; 18690da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 1870baa50dc0SBrad Aagaard flops += 2 * PetscPowInt64(bsizes[i], 3) / 3; 18710da83c2eSBarry Smith } 18723ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 187348a46eb9SPierre 
Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18749566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18760da83c2eSBarry Smith } 18770da83c2eSBarry Smith 1878422a814eSBarry Smith /* 1879422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1880422a814eSBarry Smith */ 1881ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1882d71ae5a4SJacob Faibussowitsch { 188371f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1884d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18852e5835c6SStefano Zampini const MatScalar *v; 188654f21887SBarry Smith PetscScalar *idiag, *mdiag; 188771f1c65dSBarry Smith 188871f1c65dSBarry Smith PetscFunctionBegin; 18893ba16761SJacob Faibussowitsch if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS); 18909566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 189171f1c65dSBarry Smith diag = a->diag; 18924dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18932e5835c6SStefano Zampini 189471f1c65dSBarry Smith mdiag = a->mdiag; 189571f1c65dSBarry Smith idiag = a->idiag; 18969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1897422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 189871f1c65dSBarry Smith for (i = 0; i < m; i++) { 189971f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1900899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1901899639b0SHong Zhang if (PetscRealPart(fshift)) { 19029566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 19037b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19047b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19057b6c816cSBarry Smith 
A->factorerror_zeropivot_row = i; 190698921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1907899639b0SHong Zhang } 190871f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 190971f1c65dSBarry Smith } 19109566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 191171f1c65dSBarry Smith } else { 191271f1c65dSBarry Smith for (i = 0; i < m; i++) { 191371f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 191471f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 191571f1c65dSBarry Smith } 19169566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 191771f1c65dSBarry Smith } 191871f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 19203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 192171f1c65dSBarry Smith } 192271f1c65dSBarry Smith 1923d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1924d71ae5a4SJacob Faibussowitsch { 1925416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1926e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19272e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 192854f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19293d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 193097f1f81fSBarry Smith const PetscInt *idx, *diag; 193117ab2063SBarry Smith 19323a40ed3dSBarry Smith PetscFunctionBegin; 1933b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19349566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 19353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1936b215bc84SStefano Zampini } 1937b965ef7fSBarry Smith its = its * lits; 193891723122SBarry Smith 193971f1c65dSBarry Smith if (fshift != a->fshift || omega != 
a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19409566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 194171f1c65dSBarry Smith a->fshift = fshift; 194271f1c65dSBarry Smith a->omega = omega; 1943ed480e8bSBarry Smith 194471f1c65dSBarry Smith diag = a->diag; 194571f1c65dSBarry Smith t = a->ssor_work; 1946ed480e8bSBarry Smith idiag = a->idiag; 194771f1c65dSBarry Smith mdiag = a->mdiag; 1948ed480e8bSBarry Smith 19499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19509566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19519566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1952ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 195317ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 195417ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1955ed480e8bSBarry Smith bs = b; 195617ab2063SBarry Smith for (i = 0; i < m; i++) { 195771f1c65dSBarry Smith d = fshift + mdiag[i]; 1958416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1959ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19602e5835c6SStefano Zampini v = aa + diag[i] + 1; 196117ab2063SBarry Smith sum = b[i] * d / omega; 1962003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 196317ab2063SBarry Smith x[i] = sum; 196417ab2063SBarry Smith } 19659566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19669566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19689566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 197017ab2063SBarry Smith } 1971c783ea89SBarry Smith 197208401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1973f7d195e4SLawrence 
Mitchell if (flag & SOR_EISENSTAT) { 19744c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1975887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 197617ab2063SBarry Smith 197717ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 197817ab2063SBarry Smith 1979887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 198017ab2063SBarry Smith */ 198117ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 198217ab2063SBarry Smith 198317ab2063SBarry Smith /* x = (E + U)^{-1} b */ 198417ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1985416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1986ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19872e5835c6SStefano Zampini v = aa + diag[i] + 1; 198817ab2063SBarry Smith sum = b[i]; 1989e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1990ed480e8bSBarry Smith x[i] = sum * idiag[i]; 199117ab2063SBarry Smith } 199217ab2063SBarry Smith 199317ab2063SBarry Smith /* t = b - (2*E - D)x */ 19942e5835c6SStefano Zampini v = aa; 19952205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 199617ab2063SBarry Smith 199717ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1998ed480e8bSBarry Smith ts = t; 1999416022c9SBarry Smith diag = a->diag; 200017ab2063SBarry Smith for (i = 0; i < m; i++) { 2001416022c9SBarry Smith n = diag[i] - a->i[i]; 2002ed480e8bSBarry Smith idx = a->j + a->i[i]; 20032e5835c6SStefano Zampini v = aa + a->i[i]; 200417ab2063SBarry Smith sum = t[i]; 2005003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 2006ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2007733d66baSBarry Smith /* x = x + t */ 2008733d66baSBarry Smith x[i] += t[i]; 200917ab2063SBarry Smith } 201017ab2063SBarry Smith 20119566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20129566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20139566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 
20143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 201517ab2063SBarry Smith } 201617ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 201717ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 201817ab2063SBarry Smith for (i = 0; i < m; i++) { 2019416022c9SBarry Smith n = diag[i] - a->i[i]; 2020ed480e8bSBarry Smith idx = a->j + a->i[i]; 20212e5835c6SStefano Zampini v = aa + a->i[i]; 202217ab2063SBarry Smith sum = b[i]; 2023e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20245c99c7daSBarry Smith t[i] = sum; 2025ed480e8bSBarry Smith x[i] = sum * idiag[i]; 202617ab2063SBarry Smith } 20275c99c7daSBarry Smith xb = t; 20289566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20293a40ed3dSBarry Smith } else xb = b; 203017ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 203117ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2032416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2033ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20342e5835c6SStefano Zampini v = aa + diag[i] + 1; 203517ab2063SBarry Smith sum = xb[i]; 2036e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20375c99c7daSBarry Smith if (xb == b) { 2038ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20395c99c7daSBarry Smith } else { 2040b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 204117ab2063SBarry Smith } 20425c99c7daSBarry Smith } 20439566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 204417ab2063SBarry Smith } 204517ab2063SBarry Smith its--; 204617ab2063SBarry Smith } 204717ab2063SBarry Smith while (its--) { 204817ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 204917ab2063SBarry Smith for (i = 0; i < m; i++) { 2050b19a5dc2SMark Adams /* lower */ 2051b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2052ed480e8bSBarry Smith idx = a->j + a->i[i]; 20532e5835c6SStefano 
Zampini v = aa + a->i[i]; 205417ab2063SBarry Smith sum = b[i]; 2055e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2056b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2057b19a5dc2SMark Adams /* upper */ 2058b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2059b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20602e5835c6SStefano Zampini v = aa + diag[i] + 1; 2061b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2062b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 206317ab2063SBarry Smith } 2064b19a5dc2SMark Adams xb = t; 20659566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2066b19a5dc2SMark Adams } else xb = b; 206717ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 206817ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2069b19a5dc2SMark Adams sum = xb[i]; 2070b19a5dc2SMark Adams if (xb == b) { 2071b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2072416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2073ed480e8bSBarry Smith idx = a->j + a->i[i]; 20742e5835c6SStefano Zampini v = aa + a->i[i]; 2075e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2076ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2077b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2078b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2079b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20802e5835c6SStefano Zampini v = aa + diag[i] + 1; 2081b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2082b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 208317ab2063SBarry Smith } 2084b19a5dc2SMark Adams } 2085b19a5dc2SMark Adams if (xb == b) { 20869566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2087b19a5dc2SMark Adams } else { 20889566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2089b19a5dc2SMark Adams } 209017ab2063SBarry Smith } 209117ab2063SBarry Smith } 20929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20939566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20949566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 209617ab2063SBarry Smith } 209717ab2063SBarry Smith 2098ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2099d71ae5a4SJacob Faibussowitsch { 2100416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21014e220ebcSLois Curfman McInnes 21023a40ed3dSBarry Smith PetscFunctionBegin; 21034e220ebcSLois Curfman McInnes info->block_size = 1.0; 21043966268fSBarry Smith info->nz_allocated = a->maxnz; 21053966268fSBarry Smith info->nz_used = a->nz; 21063966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21073966268fSBarry Smith info->assemblies = A->num_ass; 21083966268fSBarry Smith info->mallocs = A->info.mallocs; 21094dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2110d5f3da31SBarry Smith if (A->factortype) { 21114e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21124e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21134e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21144e220ebcSLois Curfman McInnes } else { 21154e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21164e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21174e220ebcSLois Curfman McInnes info->factor_mallocs = 
0; 21184e220ebcSLois Curfman McInnes } 21193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 212017ab2063SBarry Smith } 212117ab2063SBarry Smith 2122ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2123d71ae5a4SJacob Faibussowitsch { 2124416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2125c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 212697b48c8fSBarry Smith const PetscScalar *xx; 21272e5835c6SStefano Zampini PetscScalar *bb, *aa; 2128c7da8527SEric Chamberland PetscInt d = 0; 212917ab2063SBarry Smith 21303a40ed3dSBarry Smith PetscFunctionBegin; 213197b48c8fSBarry Smith if (x && b) { 21329566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21339566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 213497b48c8fSBarry Smith for (i = 0; i < N; i++) { 2135aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2136447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 213797b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 213897b48c8fSBarry Smith } 21399566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21409566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 214197b48c8fSBarry Smith } 214297b48c8fSBarry Smith 21439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2144a9817697SBarry Smith if (a->keepnonzeropattern) { 2145f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2146aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21479566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2148f1e2ffcdSBarry Smith } 2149f4df32b1SMatthew Knepley if (diag != 0.0) { 2150c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2151c7da8527SEric 
Chamberland d = rows[i]; 2152447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 215308401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2154c7da8527SEric Chamberland } 2155f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2156447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21572e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2158f1e2ffcdSBarry Smith } 2159f1e2ffcdSBarry Smith } 2160f1e2ffcdSBarry Smith } else { 2161f4df32b1SMatthew Knepley if (diag != 0.0) { 216217ab2063SBarry Smith for (i = 0; i < N; i++) { 2163aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21647ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2165447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2166447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2167447d62f5SStefano Zampini } else { 2168416022c9SBarry Smith a->ilen[rows[i]] = 1; 21692e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2170bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2171447d62f5SStefano Zampini } 2172447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21739566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 217417ab2063SBarry Smith } 217517ab2063SBarry Smith } 21763a40ed3dSBarry Smith } else { 217717ab2063SBarry Smith for (i = 0; i < N; i++) { 2178aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2179416022c9SBarry Smith a->ilen[rows[i]] = 0; 218017ab2063SBarry Smith } 218117ab2063SBarry Smith } 2182e56f5c9eSBarry Smith A->nonzerostate++; 2183f1e2ffcdSBarry Smith } 21849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2185dbbe0bcdSBarry Smith 
PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 218717ab2063SBarry Smith } 218817ab2063SBarry Smith 2189ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2190d71ae5a4SJacob Faibussowitsch { 21916e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21926e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21932b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21946e169961SBarry Smith const PetscScalar *xx; 21952e5835c6SStefano Zampini PetscScalar *bb, *aa; 21966e169961SBarry Smith 21976e169961SBarry Smith PetscFunctionBegin; 21983ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 21999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 22006e169961SBarry Smith if (x && b) { 22019566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 22029566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 22032b40b63fSBarry Smith vecs = PETSC_TRUE; 22046e169961SBarry Smith } 22059566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 22066e169961SBarry Smith for (i = 0; i < N; i++) { 2207aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 22088e3a54c0SPierre Jolivet PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]])); 22092205254eSKarl Rupp 22106e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22116e169961SBarry Smith } 22126e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22136e169961SBarry Smith if (!zeroed[i]) { 22146e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22154cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22162e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22172e5835c6SStefano Zampini 
aa[j] = 0.0; 22186e169961SBarry Smith } 22196e169961SBarry Smith } 22204cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i]; 22216e169961SBarry Smith } 22226e169961SBarry Smith if (x && b) { 22239566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22249566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22256e169961SBarry Smith } 22269566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22276e169961SBarry Smith if (diag != 0.0) { 22289566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22291d5a398dSstefano_zampini if (missing) { 22301d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22314cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2232aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22339566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22341d5a398dSstefano_zampini } 22351d5a398dSstefano_zampini } else { 2236ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22376e169961SBarry Smith } 22381d5a398dSstefano_zampini } 22399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2240dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22426e169961SBarry Smith } 22436e169961SBarry Smith 2244d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2245d71ae5a4SJacob Faibussowitsch { 2246fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2247fff043a9SJunchao Zhang const PetscScalar *aa; 224817ab2063SBarry Smith 22493a40ed3dSBarry Smith PetscFunctionBegin; 22509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
2251416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22528e3a54c0SPierre Jolivet if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]); 225317ab2063SBarry Smith if (idx) { 22545c0db29aSPierre Jolivet if (*nz && a->j) *idx = a->j + a->i[row]; 2255f4259b30SLisandro Dalcin else *idx = NULL; 225617ab2063SBarry Smith } 22579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225917ab2063SBarry Smith } 226017ab2063SBarry Smith 2261d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2262d71ae5a4SJacob Faibussowitsch { 22633a40ed3dSBarry Smith PetscFunctionBegin; 22643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 226517ab2063SBarry Smith } 226617ab2063SBarry Smith 2267ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2268d71ae5a4SJacob Faibussowitsch { 2269416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22702e5835c6SStefano Zampini const MatScalar *v; 227136db0b34SBarry Smith PetscReal sum = 0.0; 227297f1f81fSBarry Smith PetscInt i, j; 227317ab2063SBarry Smith 22743a40ed3dSBarry Smith PetscFunctionBegin; 22759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 227617ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2277570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2278570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2279792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2280570b7f6dSBarry Smith #else 2281416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22829371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22839371c9d4SSatish Balay v++; 228417ab2063SBarry Smith } 22858f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2286570b7f6dSBarry Smith #endif 22879566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22883a40ed3dSBarry Smith } else if (type == NORM_1) { 228936db0b34SBarry Smith PetscReal *tmp; 229097f1f81fSBarry Smith PetscInt *jj = a->j; 22919566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2292064f8208SBarry Smith *nrm = 0.0; 2293416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22949371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22959371c9d4SSatish Balay v++; 229617ab2063SBarry Smith } 2297d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2298064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 229917ab2063SBarry Smith } 23009566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23019566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 23023a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2303064f8208SBarry Smith *nrm = 0.0; 2304d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 23058e3a54c0SPierre Jolivet const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]); 230617ab2063SBarry Smith sum = 0.0; 2307416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23089371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23099371c9d4SSatish Balay v2++; 231017ab2063SBarry Smith } 2311064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 231217ab2063SBarry Smith } 23139566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2314f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 231717ab2063SBarry Smith } 231817ab2063SBarry Smith 2319ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2320d71ae5a4SJacob Faibussowitsch { 23213d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 232254f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 
23232e5835c6SStefano Zampini const MatScalar *va, *vb; 232497f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2325cd0d46ebSvictorle 2326cd0d46ebSvictorle PetscFunctionBegin; 23279566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23289566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23295485867bSBarry Smith if (ma != nb || na != mb) { 23305485867bSBarry Smith *f = PETSC_FALSE; 23313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23325485867bSBarry Smith } 23339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23359371c9d4SSatish Balay aii = aij->i; 23369371c9d4SSatish Balay bii = bij->i; 23379371c9d4SSatish Balay adx = aij->j; 23389371c9d4SSatish Balay bdx = bij->j; 23399566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2341cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2342cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2343cd0d46ebSvictorle 2344cd0d46ebSvictorle *f = PETSC_TRUE; 2345cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2346cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 234797f1f81fSBarry Smith PetscInt idc, idr; 23485485867bSBarry Smith PetscScalar vc, vr; 2349cd0d46ebSvictorle /* column/row index/value */ 23505485867bSBarry Smith idc = adx[aptr[i]]; 23515485867bSBarry Smith idr = bdx[bptr[idc]]; 23525485867bSBarry Smith vc = va[aptr[i]]; 23535485867bSBarry Smith vr = vb[bptr[idc]]; 23545485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23555485867bSBarry Smith *f = PETSC_FALSE; 23565485867bSBarry Smith goto done; 2357cd0d46ebSvictorle } else { 23585485867bSBarry Smith aptr[i]++; 23595485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2360cd0d46ebSvictorle } 2361cd0d46ebSvictorle } 2362cd0d46ebSvictorle } 2363cd0d46ebSvictorle done: 23649566063dSJacob Faibussowitsch 
PetscCall(PetscFree(aptr)); 23659566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 23683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2369cd0d46ebSvictorle } 2370cd0d46ebSvictorle 2371ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2372d71ae5a4SJacob Faibussowitsch { 23733d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 237454f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 237554f21887SBarry Smith MatScalar *va, *vb; 23761cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23771cbb95d3SBarry Smith 23781cbb95d3SBarry Smith PetscFunctionBegin; 23799566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23809566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23811cbb95d3SBarry Smith if (ma != nb || na != mb) { 23821cbb95d3SBarry Smith *f = PETSC_FALSE; 23833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23841cbb95d3SBarry Smith } 23859371c9d4SSatish Balay aii = aij->i; 23869371c9d4SSatish Balay bii = bij->i; 23879371c9d4SSatish Balay adx = aij->j; 23889371c9d4SSatish Balay bdx = bij->j; 23899371c9d4SSatish Balay va = aij->a; 23909371c9d4SSatish Balay vb = bij->a; 23919566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23929566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23931cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23941cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23951cbb95d3SBarry Smith 23961cbb95d3SBarry Smith *f = PETSC_TRUE; 23971cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 23981cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 23991cbb95d3SBarry Smith PetscInt idc, idr; 24001cbb95d3SBarry Smith PetscScalar vc, vr; 24011cbb95d3SBarry 
Smith /* column/row index/value */ 24021cbb95d3SBarry Smith idc = adx[aptr[i]]; 24031cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24041cbb95d3SBarry Smith vc = va[aptr[i]]; 24051cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24061cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24071cbb95d3SBarry Smith *f = PETSC_FALSE; 24081cbb95d3SBarry Smith goto done; 24091cbb95d3SBarry Smith } else { 24101cbb95d3SBarry Smith aptr[i]++; 24111cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24121cbb95d3SBarry Smith } 24131cbb95d3SBarry Smith } 24141cbb95d3SBarry Smith } 24151cbb95d3SBarry Smith done: 24169566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24179566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24191cbb95d3SBarry Smith } 24201cbb95d3SBarry Smith 2421d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2422d71ae5a4SJacob Faibussowitsch { 2423416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2424fff8e43fSBarry Smith const PetscScalar *l, *r; 2425fff8e43fSBarry Smith PetscScalar x; 242654f21887SBarry Smith MatScalar *v; 2427fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2428fff8e43fSBarry Smith const PetscInt *jj; 242917ab2063SBarry Smith 24303a40ed3dSBarry Smith PetscFunctionBegin; 243117ab2063SBarry Smith if (ll) { 24323ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24333ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24349566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 243508401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24369566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 243817ab2063SBarry Smith for (i = 0; i < m; i++) { 243917ab2063SBarry Smith x = 
l[i]; 2440416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24412205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 244217ab2063SBarry Smith } 24439566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24449566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 244617ab2063SBarry Smith } 244717ab2063SBarry Smith if (rr) { 24489566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 244908401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24509566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24522e5835c6SStefano Zampini jj = a->j; 24532205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24559566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24569566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 245717ab2063SBarry Smith } 24589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 246017ab2063SBarry Smith } 246117ab2063SBarry Smith 2462d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2463d71ae5a4SJacob Faibussowitsch { 2464db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2465d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 246697f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24675d0c19d7SBarry Smith const PetscInt *irow, *icol; 24682e5835c6SStefano Zampini const PetscScalar *aa; 24695d0c19d7SBarry Smith PetscInt nrows, ncols; 247097f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = 
a->ilen; 2471fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2472416022c9SBarry Smith Mat C; 2473cdc6f3adSToby Isaac PetscBool stride; 247417ab2063SBarry Smith 24753a40ed3dSBarry Smith PetscFunctionBegin; 24769566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24779566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24789566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 247917ab2063SBarry Smith 24809566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2481ff718158SBarry Smith if (stride) { 24829566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2483ff718158SBarry Smith } else { 2484ff718158SBarry Smith first = 0; 2485ff718158SBarry Smith step = 0; 2486ff718158SBarry Smith } 2487fee21e36SBarry Smith if (stride && step == 1) { 248802834360SBarry Smith /* special case of contiguous rows */ 24899566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 249002834360SBarry Smith /* loop over new rows determining lens and starting points */ 249102834360SBarry Smith for (i = 0; i < nrows; i++) { 2492bfeeae90SHong Zhang kstart = ai[irow[i]]; 2493a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2494a91a9bebSLisandro Dalcin starts[i] = kstart; 249502834360SBarry Smith for (k = kstart; k < kend; k++) { 2496bfeeae90SHong Zhang if (aj[k] >= first) { 249702834360SBarry Smith starts[i] = k; 249802834360SBarry Smith break; 249902834360SBarry Smith } 250002834360SBarry Smith } 2501a2744918SBarry Smith sum = 0; 250202834360SBarry Smith while (k < kend) { 2503bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2504a2744918SBarry Smith sum++; 250502834360SBarry Smith } 2506a2744918SBarry Smith lens[i] = sum; 250702834360SBarry Smith } 250802834360SBarry Smith /* create submatrix */ 2509cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 251097f1f81fSBarry Smith PetscInt n_cols, n_rows; 25119566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2512aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25139566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 251408480c60SBarry Smith C = *B; 25153a40ed3dSBarry Smith } else { 25163bef6203SJed Brown PetscInt rbs, cbs; 25179566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25189566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25199566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25209566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25219566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25229566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 252408480c60SBarry Smith } 2525db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2526db02288aSLois Curfman McInnes 252702834360SBarry Smith /* loop over rows inserting into submatrix */ 2528fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2529db02288aSLois Curfman McInnes j_new = c->j; 2530db02288aSLois Curfman McInnes i_new = c->i; 25319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 253202834360SBarry Smith for (i = 0; i < nrows; i++) { 2533a2744918SBarry Smith ii = starts[i]; 2534a2744918SBarry Smith lensi = lens[i]; 2535810441c8SPierre Jolivet if (lensi) { 2536ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25379566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2538a2744918SBarry Smith a_new += lensi; 2539810441c8SPierre Jolivet } 2540a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2541a2744918SBarry 
Smith c->ilen[i] = lensi; 254202834360SBarry Smith } 2543fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25459566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25463a40ed3dSBarry Smith } else { 25479566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25489566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25504dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25516bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25524dcab191SBarry Smith smap[icol[i]] = i + 1; 25534dcab191SBarry Smith } 25544dcab191SBarry Smith 255502834360SBarry Smith /* determine lens of each row */ 255602834360SBarry Smith for (i = 0; i < nrows; i++) { 2557bfeeae90SHong Zhang kstart = ai[irow[i]]; 255802834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 255902834360SBarry Smith lens[i] = 0; 256002834360SBarry Smith for (k = kstart; k < kend; k++) { 2561ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 256202834360SBarry Smith } 256302834360SBarry Smith } 256417ab2063SBarry Smith /* Create and fill new matrix */ 2565a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2566ace3abfcSBarry Smith PetscBool equal; 25670f5bd95cSBarry Smith 256899141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2569aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25709566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 2571fdfbdca6SPierre Jolivet PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. 
wrong number of nonzeros"); 25729566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 257308480c60SBarry Smith C = *B; 25743a40ed3dSBarry Smith } else { 25753bef6203SJed Brown PetscInt rbs, cbs; 25769566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25779566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25789566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25799566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 258037a5e0faSPierre Jolivet if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25819566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 258308480c60SBarry Smith } 25849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2585fb3c7e2dSJunchao Zhang 2586f4f49eeaSPierre Jolivet c = (Mat_SeqAIJ *)C->data; 2587fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 258817ab2063SBarry Smith for (i = 0; i < nrows; i++) { 258999141d43SSatish Balay row = irow[i]; 2590bfeeae90SHong Zhang kstart = ai[row]; 259199141d43SSatish Balay kend = kstart + a->ilen[row]; 2592bfeeae90SHong Zhang mat_i = c->i[i]; 25938e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 25948e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 259599141d43SSatish Balay mat_ilen = c->ilen + i; 259617ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2597bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2598ed480e8bSBarry Smith *mat_j++ = tcol - 1; 25992e5835c6SStefano Zampini *mat_a++ = aa[k]; 260099141d43SSatish Balay (*mat_ilen)++; 260117ab2063SBarry Smith } 260217ab2063SBarry Smith } 260317ab2063SBarry Smith } 26049566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 260502834360SBarry Smith /* Free work space */ 26069566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26079566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26089566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2609cdc6f3adSToby Isaac /* sort */ 2610cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2611cdc6f3adSToby Isaac PetscInt ilen; 2612cdc6f3adSToby Isaac 2613cdc6f3adSToby Isaac mat_i = c->i[i]; 26148e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 26158e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 2616cdc6f3adSToby Isaac ilen = c->ilen[i]; 26179566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2618cdc6f3adSToby Isaac } 2619fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 262002834360SBarry Smith } 26218c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26229566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2623305c6ccfSStefano Zampini #endif 26249566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26259566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 262617ab2063SBarry Smith 26279566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2628416022c9SBarry Smith *B = C; 26293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 263017ab2063SBarry Smith } 263117ab2063SBarry Smith 2632ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2633d71ae5a4SJacob Faibussowitsch { 263482d44351SHong Zhang Mat B; 263582d44351SHong Zhang 263682d44351SHong Zhang PetscFunctionBegin; 2637c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26389566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26399566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, 
mat->rmap->n, mat->cmap->n)); 26409566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26419566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26429566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 264382d44351SHong Zhang *subMat = B; 2644c2d650bdSHong Zhang } else { 26459566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2646c2d650bdSHong Zhang } 26473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 264882d44351SHong Zhang } 264982d44351SHong Zhang 2650ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2651d71ae5a4SJacob Faibussowitsch { 265263b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 265363b91edcSBarry Smith Mat outA; 2654ace3abfcSBarry Smith PetscBool row_identity, col_identity; 265563b91edcSBarry Smith 26563a40ed3dSBarry Smith PetscFunctionBegin; 265708401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26581df811f5SHong Zhang 26599566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26609566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2661a871dcd8SBarry Smith 266263b91edcSBarry Smith outA = inA; 2663d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26649566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26659566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26662205254eSKarl Rupp 26679566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26689566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26692205254eSKarl Rupp 2670c3122656SLisandro Dalcin a->row = row; 26712205254eSKarl Rupp 26729566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26739566063dSJacob Faibussowitsch 
PetscCall(ISDestroy(&a->col)); 26742205254eSKarl Rupp 2675c3122656SLisandro Dalcin a->col = col; 267663b91edcSBarry Smith 267736db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26789566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26799566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2680f0ec6fceSSatish Balay 268194a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 268394a9d846SBarry Smith } 268463b91edcSBarry Smith 26859566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2686137fb511SHong Zhang if (row_identity && col_identity) { 26879566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2688137fb511SHong Zhang } else { 26899566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2690137fb511SHong Zhang } 26913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2692a871dcd8SBarry Smith } 2693a871dcd8SBarry Smith 2694d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2695d71ae5a4SJacob Faibussowitsch { 2696f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2697dfa0f9e5SStefano Zampini PetscScalar *v; 2698c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 26993a40ed3dSBarry Smith 27003a40ed3dSBarry Smith PetscFunctionBegin; 27019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27029566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2703792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27049566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 
27073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2708f0b747eeSBarry Smith } 2709f0b747eeSBarry Smith 2710d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2711d71ae5a4SJacob Faibussowitsch { 271216b64355SHong Zhang PetscInt i; 271316b64355SHong Zhang 271416b64355SHong Zhang PetscFunctionBegin; 271516b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27169566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 271716b64355SHong Zhang 271848a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27199566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 272016b64355SHong Zhang 272116b64355SHong Zhang if (submatj->rbuf1) { 27229566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27239566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 272416b64355SHong Zhang } 272516b64355SHong Zhang 272648a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27279566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27289566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 272916b64355SHong Zhang } 273016b64355SHong Zhang 273116b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2732eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27339566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27349566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 273516b64355SHong Zhang #else 27369566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 273716b64355SHong Zhang #endif 273816b64355SHong Zhang 273916b64355SHong Zhang if (!submatj->allcolumns) { 274016b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 
2741835f2295SStefano Zampini PetscCall(PetscHMapIDestroy(&submatj->cmap)); 274216b64355SHong Zhang #else 27439566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 274416b64355SHong Zhang #endif 274516b64355SHong Zhang } 27469566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 274716b64355SHong Zhang 27489566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 27493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 275016b64355SHong Zhang } 275116b64355SHong Zhang 2752d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2753d71ae5a4SJacob Faibussowitsch { 275416b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27555c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 275616b64355SHong Zhang 275716b64355SHong Zhang PetscFunctionBegin; 27589566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27599566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 276116b64355SHong Zhang } 276216b64355SHong Zhang 276389a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2764ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2765d71ae5a4SJacob Faibussowitsch { 27662d033e1fSHong Zhang PetscInt i; 27670fb991dcSHong Zhang Mat C; 27680fb991dcSHong Zhang Mat_SeqAIJ *c; 27690fb991dcSHong Zhang Mat_SubSppt *submatj; 27702d033e1fSHong Zhang 27712d033e1fSHong Zhang PetscFunctionBegin; 27722d033e1fSHong Zhang for (i = 0; i < n; i++) { 27730fb991dcSHong Zhang C = (*mat)[i]; 27740fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27750fb991dcSHong Zhang submatj = c->submatis1; 27762d033e1fSHong Zhang if (submatj) { 2777682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 277826cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27799566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 
27809566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27819566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27823faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27839566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27849566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27859566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2786682e4c99SStefano Zampini } 27872d033e1fSHong Zhang } else { 27889566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27892d033e1fSHong Zhang } 27902d033e1fSHong Zhang } 279186e85357SHong Zhang 279263a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27939566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 279463a75b2aSHong Zhang 27959566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 27963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 27972d033e1fSHong Zhang } 27982d033e1fSHong Zhang 2799ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2800d71ae5a4SJacob Faibussowitsch { 280197f1f81fSBarry Smith PetscInt i; 2802cddf8d76SBarry Smith 28033a40ed3dSBarry Smith PetscFunctionBegin; 280448a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2805cddf8d76SBarry Smith 280648a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2808cddf8d76SBarry Smith } 2809cddf8d76SBarry Smith 2810ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2811d71ae5a4SJacob Faibussowitsch { 2812e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28139a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, 
isz, val; 28145d0c19d7SBarry Smith const PetscInt *idx; 281558b7e2c1SStefano Zampini PetscInt start, end, *ai, *aj, bs = A->rmap->bs == A->cmap->bs ? A->rmap->bs : 1; 2816f1af5d2fSBarry Smith PetscBT table; 2817bbd702dbSSatish Balay 28183a40ed3dSBarry Smith PetscFunctionBegin; 28199a88ca10SBarry Smith m = A->rmap->n / bs; 2820e4d965acSSatish Balay ai = a->i; 2821bfeeae90SHong Zhang aj = a->j; 28228a047759SSatish Balay 282308401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 282406763907SSatish Balay 28259566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28269566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 282706763907SSatish Balay 2828e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2829b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2830e4d965acSSatish Balay isz = 0; 28319566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2832e4d965acSSatish Balay 2833e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28349566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28359566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2836e4d965acSSatish Balay 28379a88ca10SBarry Smith if (bs > 1) { 28389a88ca10SBarry Smith /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 28399a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28409a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28419a88ca10SBarry Smith } 28429a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28439a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28449a88ca10SBarry Smith 28459a88ca10SBarry Smith k = 0; 28469a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28479a88ca10SBarry Smith n = isz; 28489a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28499a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28509a88ca10SBarry Smith row = bs * nidx[k] + ll; 28519a88ca10SBarry Smith start = ai[row]; 28529a88ca10SBarry Smith end = ai[row + 1]; 28539a88ca10SBarry Smith for (l = start; l < end; l++) { 28549a88ca10SBarry Smith val = aj[l] / bs; 28559a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28569a88ca10SBarry Smith } 28579a88ca10SBarry Smith } 28589a88ca10SBarry Smith } 28599a88ca10SBarry Smith } 286057508eceSPierre Jolivet PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, is + i)); 28619a88ca10SBarry Smith } else { 2862dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2863e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28642205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28654dcbc457SBarry Smith } 28669566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28679566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2868e4d965acSSatish Balay 286904a348a9SBarry Smith k = 0; 287004a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 287104a348a9SBarry Smith n = isz; 287206763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2873e4d965acSSatish Balay row = nidx[k]; 2874e4d965acSSatish Balay start = ai[row]; 2875e4d965acSSatish Balay end = ai[row + 1]; 287604a348a9SBarry Smith for (l = start; l < end; l++) { 2877efb16452SHong Zhang val = aj[l]; 28782205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2879e4d965acSSatish Balay } 2880e4d965acSSatish Balay } 2881e4d965acSSatish Balay } 288257508eceSPierre Jolivet PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, is + i)); 2883e4d965acSSatish Balay } 28849a88ca10SBarry Smith } 28859566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28869566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28884dcbc457SBarry Smith } 288917ab2063SBarry Smith 2890ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2891d71ae5a4SJacob Faibussowitsch { 28920513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28933b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 28945d0c19d7SBarry Smith const PetscInt *row, *col; 28955d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 289656cd22aeSBarry Smith IS icolp, irowp; 28970298fd71SBarry Smith PetscInt *cwork = NULL; 28980298fd71SBarry Smith PetscScalar *vwork = NULL; 28990513a670SBarry Smith 
29003a40ed3dSBarry Smith PetscFunctionBegin; 29019566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29029566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29039566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29049566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29050513a670SBarry Smith 29060513a670SBarry Smith /* determine lengths of permuted rows */ 29079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29082205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29099566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29109566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29119566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29129566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29149566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29150513a670SBarry Smith 29169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29170513a670SBarry Smith for (i = 0; i < m; i++) { 29189566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29192205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29209566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29219566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29220513a670SBarry Smith } 29239566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29242205254eSKarl Rupp 29253c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29262205254eSKarl Rupp 29278c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29289566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29299fe5e383SStefano Zampini #endif 
29309566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29319566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29329566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29339566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29349566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29359566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 293648a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29380513a670SBarry Smith } 29390513a670SBarry Smith 2940d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2941d71ae5a4SJacob Faibussowitsch { 2942cb5b572fSBarry Smith PetscFunctionBegin; 294333f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 294433f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2945be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2946be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29472e5835c6SStefano Zampini const PetscScalar *aa; 29483ac85a22SJunchao Zhang PetscScalar *bb; 2949be6bf707SBarry Smith 29509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 29513ac85a22SJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(B, &bb)); 29523ac85a22SJunchao Zhang 295308401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29543ac85a22SJunchao Zhang PetscCall(PetscArraycpy(bb, aa, a->i[A->rmap->n])); 29559566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 29573ac85a22SJunchao Zhang 
PetscCall(MatSeqAIJRestoreArrayWrite(B, &bb)); 2958cb5b572fSBarry Smith } else { 29599566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2960cb5b572fSBarry Smith } 29613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2962cb5b572fSBarry Smith } 2963cb5b572fSBarry Smith 2964d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2965d71ae5a4SJacob Faibussowitsch { 29666c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29676e111a19SKarl Rupp 29686c0721eeSBarry Smith PetscFunctionBegin; 29696c0721eeSBarry Smith *array = a->a; 29703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29716c0721eeSBarry Smith } 29726c0721eeSBarry Smith 2973d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[]) 2974d71ae5a4SJacob Faibussowitsch { 29756c0721eeSBarry Smith PetscFunctionBegin; 2976f38c1e66SStefano Zampini *array = NULL; 29773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29786c0721eeSBarry Smith } 2979273d9f13SBarry Smith 29808229c054SShri Abhyankar /* 29818229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29828229c054SShri Abhyankar have different nonzero structure. 
29838229c054SShri Abhyankar */ 2984d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2985d71ae5a4SJacob Faibussowitsch { 2986b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2987ec7775f6SShri Abhyankar 2988ec7775f6SShri Abhyankar PetscFunctionBegin; 2989ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2990ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 29918e3a54c0SPierre Jolivet const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]); 2992b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 2993b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 29948af7cee1SJed Brown nnz[i] = 0; 29958af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 2996b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2997b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 29988af7cee1SJed Brown nnz[i]++; 29998af7cee1SJed Brown } 30008af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 3001ec7775f6SShri Abhyankar } 30023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3003ec7775f6SShri Abhyankar } 3004ec7775f6SShri Abhyankar 3005d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3006d71ae5a4SJacob Faibussowitsch { 3007b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3008b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3009b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data; 3010b264fe52SHong Zhang 3011b264fe52SHong Zhang PetscFunctionBegin; 3012b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30139566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 30143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3015b264fe52SHong Zhang } 
3016b264fe52SHong Zhang 3017d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3018d71ae5a4SJacob Faibussowitsch { 3019ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3020ac90fabeSBarry Smith 3021ac90fabeSBarry Smith PetscFunctionBegin; 3022134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3023134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3024134adf20SPierre Jolivet if (e) { 30259566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 302681fa06acSBarry Smith if (e) { 30279566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3028134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 302981fa06acSBarry Smith } 303081fa06acSBarry Smith } 303154c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 303281fa06acSBarry Smith } 3033ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30342e5835c6SStefano Zampini const PetscScalar *xa; 30352e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 303681fa06acSBarry Smith PetscBLASInt one = 1, bnz; 303781fa06acSBarry Smith 30389566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3041792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 30429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30449566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30469566063dSJacob 
Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3047ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30489566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3049ac90fabeSBarry Smith } else { 30508229c054SShri Abhyankar Mat B; 30518229c054SShri Abhyankar PetscInt *nnz; 30529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30539566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30549566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30559566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30569566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30579566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30599566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30609566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30619bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30629566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3063ac90fabeSBarry Smith } 30643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3065ac90fabeSBarry Smith } 3066ac90fabeSBarry Smith 3067d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3068d71ae5a4SJacob Faibussowitsch { 3069354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3070354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3071354c94deSBarry Smith PetscInt i, nz; 3072354c94deSBarry Smith PetscScalar *a; 3073354c94deSBarry Smith 3074354c94deSBarry Smith PetscFunctionBegin; 3075354c94deSBarry Smith nz = aij->nz; 30769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30772205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 
30789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3079354c94deSBarry Smith #else 3080354c94deSBarry Smith PetscFunctionBegin; 3081354c94deSBarry Smith #endif 30823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3083354c94deSBarry Smith } 3084354c94deSBarry Smith 3085ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3086d71ae5a4SJacob Faibussowitsch { 3087e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3088d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3089e34fafa9SBarry Smith PetscReal atmp; 3090985db425SBarry Smith PetscScalar *x; 3091ce496241SStefano Zampini const MatScalar *aa, *av; 3092e34fafa9SBarry Smith 3093e34fafa9SBarry Smith PetscFunctionBegin; 309428b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 30959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3096ce496241SStefano Zampini aa = av; 3097e34fafa9SBarry Smith ai = a->i; 3098e34fafa9SBarry Smith aj = a->j; 3099e34fafa9SBarry Smith 31009566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31019566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 310208401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3103e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31049371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31059371c9d4SSatish Balay ai++; 310662e5df07SMark Adams x[i] = 0; 3107e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3108985db425SBarry Smith atmp = PetscAbsScalar(*aa); 31099371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31109371c9d4SSatish Balay x[i] = atmp; 31119371c9d4SSatish Balay if (idx) idx[i] = *aj; 31129371c9d4SSatish Balay } 31139371c9d4SSatish Balay aa++; 31149371c9d4SSatish Balay aj++; 3115985db425SBarry Smith } 3116985db425SBarry Smith } 31179566063dSJacob 
Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3120985db425SBarry Smith } 3121985db425SBarry Smith 3122eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v) 3123eede4a3fSMark Adams { 3124eede4a3fSMark Adams Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3125eede4a3fSMark Adams PetscInt i, j, m = A->rmap->n, *ai, ncols, n; 3126eede4a3fSMark Adams PetscScalar *x; 3127eede4a3fSMark Adams const MatScalar *aa, *av; 3128eede4a3fSMark Adams 3129eede4a3fSMark Adams PetscFunctionBegin; 3130eede4a3fSMark Adams PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3131eede4a3fSMark Adams PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3132eede4a3fSMark Adams aa = av; 3133eede4a3fSMark Adams ai = a->i; 3134eede4a3fSMark Adams 3135eede4a3fSMark Adams PetscCall(VecGetArrayWrite(v, &x)); 3136eede4a3fSMark Adams PetscCall(VecGetLocalSize(v, &n)); 3137eede4a3fSMark Adams PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3138eede4a3fSMark Adams for (i = 0; i < m; i++) { 3139eede4a3fSMark Adams ncols = ai[1] - ai[0]; 3140eede4a3fSMark Adams ai++; 314162e5df07SMark Adams x[i] = 0; 3142eede4a3fSMark Adams for (j = 0; j < ncols; j++) { 3143eede4a3fSMark Adams x[i] += PetscAbsScalar(*aa); 3144eede4a3fSMark Adams aa++; 3145eede4a3fSMark Adams } 3146eede4a3fSMark Adams } 3147eede4a3fSMark Adams PetscCall(VecRestoreArrayWrite(v, &x)); 3148eede4a3fSMark Adams PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3149eede4a3fSMark Adams PetscFunctionReturn(PETSC_SUCCESS); 3150eede4a3fSMark Adams } 3151eede4a3fSMark Adams 3152ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3153d71ae5a4SJacob Faibussowitsch { 3154985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3155d0f46423SBarry 
Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3156985db425SBarry Smith PetscScalar *x; 3157ce496241SStefano Zampini const MatScalar *aa, *av; 3158985db425SBarry Smith 3159985db425SBarry Smith PetscFunctionBegin; 316028b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3162ce496241SStefano Zampini aa = av; 3163985db425SBarry Smith ai = a->i; 3164985db425SBarry Smith aj = a->j; 3165985db425SBarry Smith 31669566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31679566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 316808401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3169985db425SBarry Smith for (i = 0; i < m; i++) { 31709371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31719371c9d4SSatish Balay ai++; 3172d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31739371c9d4SSatish Balay x[i] = *aa; 31749371c9d4SSatish Balay if (idx) idx[i] = 0; 3175985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3176985db425SBarry Smith x[i] = 0.0; 3177985db425SBarry Smith if (idx) { 3178985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3179985db425SBarry Smith if (aj[j] > j) { 3180985db425SBarry Smith idx[i] = j; 3181985db425SBarry Smith break; 3182985db425SBarry Smith } 3183985db425SBarry Smith } 31841a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31851a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3186985db425SBarry Smith } 3187985db425SBarry Smith } 3188985db425SBarry Smith for (j = 0; j < ncols; j++) { 31899371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31909371c9d4SSatish Balay x[i] = *aa; 31919371c9d4SSatish Balay if (idx) idx[i] = *aj; 
31929371c9d4SSatish Balay } 31939371c9d4SSatish Balay aa++; 31949371c9d4SSatish Balay aj++; 3195985db425SBarry Smith } 3196985db425SBarry Smith } 31979566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3200985db425SBarry Smith } 3201985db425SBarry Smith 3202ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3203d71ae5a4SJacob Faibussowitsch { 3204c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3205c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3206ce496241SStefano Zampini PetscScalar *x; 3207ce496241SStefano Zampini const MatScalar *aa, *av; 3208c87e5d42SMatthew Knepley 3209c87e5d42SMatthew Knepley PetscFunctionBegin; 32109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3211ce496241SStefano Zampini aa = av; 3212c87e5d42SMatthew Knepley ai = a->i; 3213c87e5d42SMatthew Knepley aj = a->j; 3214c87e5d42SMatthew Knepley 32159566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32169566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 321708401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. 
%" PetscInt_FMT " rows", m, n); 3218c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32199371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32209371c9d4SSatish Balay ai++; 3221f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32229371c9d4SSatish Balay x[i] = *aa; 32239371c9d4SSatish Balay if (idx) idx[i] = 0; 3224f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3225f07e67edSHong Zhang x[i] = 0.0; 3226f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3227289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3228f07e67edSHong Zhang if (aj[j] > j) { 3229f07e67edSHong Zhang idx[i] = j; 32302205254eSKarl Rupp break; 32312205254eSKarl Rupp } 3232289a08f5SMatthew Knepley } 3233f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3234f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3235f07e67edSHong Zhang } 3236289a08f5SMatthew Knepley } 3237c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32389371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32399371c9d4SSatish Balay x[i] = *aa; 32409371c9d4SSatish Balay if (idx) idx[i] = *aj; 32419371c9d4SSatish Balay } 32429371c9d4SSatish Balay aa++; 32439371c9d4SSatish Balay aj++; 3244c87e5d42SMatthew Knepley } 3245c87e5d42SMatthew Knepley } 32469566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3249c87e5d42SMatthew Knepley } 3250c87e5d42SMatthew Knepley 3251ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3252d71ae5a4SJacob Faibussowitsch { 3253985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3254d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3255d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3256985db425SBarry Smith PetscScalar *x; 
3257ce496241SStefano Zampini const MatScalar *aa, *av; 3258985db425SBarry Smith 3259985db425SBarry Smith PetscFunctionBegin; 326028b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3262ce496241SStefano Zampini aa = av; 3263985db425SBarry Smith ai = a->i; 3264985db425SBarry Smith aj = a->j; 3265985db425SBarry Smith 32669566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32679566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 326808401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3269985db425SBarry Smith for (i = 0; i < m; i++) { 32709371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32719371c9d4SSatish Balay ai++; 3272d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32739371c9d4SSatish Balay x[i] = *aa; 32749371c9d4SSatish Balay if (idx) idx[i] = 0; 3275985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3276985db425SBarry Smith x[i] = 0.0; 3277985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3278985db425SBarry Smith for (j = 0; j < ncols; j++) { 3279985db425SBarry Smith if (aj[j] > j) { 3280985db425SBarry Smith idx[i] = j; 3281985db425SBarry Smith break; 3282985db425SBarry Smith } 3283985db425SBarry Smith } 3284fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3285fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3286985db425SBarry Smith } 3287985db425SBarry Smith } 3288985db425SBarry Smith for (j = 0; j < ncols; j++) { 32899371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32909371c9d4SSatish Balay x[i] = *aa; 32919371c9d4SSatish Balay if (idx) idx[i] = *aj; 32929371c9d4SSatish Balay } 32939371c9d4SSatish Balay aa++; 32949371c9d4SSatish Balay aj++; 3295e34fafa9SBarry Smith } 
3296e34fafa9SBarry Smith } 32979566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3300e34fafa9SBarry Smith } 3301bbead8a2SBarry Smith 3302ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3303d71ae5a4SJacob Faibussowitsch { 3304bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 330558b7e2c1SStefano Zampini PetscInt i, bs = A->rmap->bs, mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3306bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 33070da83c2eSBarry Smith const PetscReal shift = 0.0; 33081a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3309bbead8a2SBarry Smith 3310bbead8a2SBarry Smith PetscFunctionBegin; 3311a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33124a0d0026SBarry Smith if (a->ibdiagvalid) { 33134a0d0026SBarry Smith if (values) *values = a->ibdiag; 33143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 33154a0d0026SBarry Smith } 33169566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 33174dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3318bbead8a2SBarry Smith diag = a->ibdiag; 3319bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3320bbead8a2SBarry Smith /* factor and invert each block */ 3321bbead8a2SBarry Smith switch (bs) { 3322bbead8a2SBarry Smith case 1: 3323bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33249566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 3325ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3326ec1892c8SHong Zhang if (allowzeropivot) { 33277b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33287b6c816cSBarry Smith 
A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33297b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33309566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 333198921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3332ec1892c8SHong Zhang } 3333bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3334bbead8a2SBarry Smith } 3335bbead8a2SBarry Smith break; 3336bbead8a2SBarry Smith case 2: 3337bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33389371c9d4SSatish Balay ij[0] = 2 * i; 33399371c9d4SSatish Balay ij[1] = 2 * i + 1; 33409566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33427b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33439566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3344bbead8a2SBarry Smith diag += 4; 3345bbead8a2SBarry Smith } 3346bbead8a2SBarry Smith break; 3347bbead8a2SBarry Smith case 3: 3348bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33499371c9d4SSatish Balay ij[0] = 3 * i; 33509371c9d4SSatish Balay ij[1] = 3 * i + 1; 33519371c9d4SSatish Balay ij[2] = 3 * i + 2; 33529566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33539566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 33547b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33559566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3356bbead8a2SBarry Smith diag += 9; 
3357bbead8a2SBarry Smith } 3358bbead8a2SBarry Smith break; 3359bbead8a2SBarry Smith case 4: 3360bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33619371c9d4SSatish Balay ij[0] = 4 * i; 33629371c9d4SSatish Balay ij[1] = 4 * i + 1; 33639371c9d4SSatish Balay ij[2] = 4 * i + 2; 33649371c9d4SSatish Balay ij[3] = 4 * i + 3; 33659566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33669566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33677b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33689566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3369bbead8a2SBarry Smith diag += 16; 3370bbead8a2SBarry Smith } 3371bbead8a2SBarry Smith break; 3372bbead8a2SBarry Smith case 5: 3373bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33749371c9d4SSatish Balay ij[0] = 5 * i; 33759371c9d4SSatish Balay ij[1] = 5 * i + 1; 33769371c9d4SSatish Balay ij[2] = 5 * i + 2; 33779371c9d4SSatish Balay ij[3] = 5 * i + 3; 33789371c9d4SSatish Balay ij[4] = 5 * i + 4; 33799566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33809566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33817b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33829566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3383bbead8a2SBarry Smith diag += 25; 3384bbead8a2SBarry Smith } 3385bbead8a2SBarry Smith break; 3386bbead8a2SBarry Smith case 6: 3387bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33889371c9d4SSatish Balay ij[0] = 6 * i; 33899371c9d4SSatish Balay ij[1] = 6 * i + 1; 33909371c9d4SSatish Balay ij[2] = 6 * i + 2; 33919371c9d4SSatish Balay ij[3] = 6 * i + 3; 33929371c9d4SSatish Balay ij[4] = 6 * i + 4; 33939371c9d4SSatish Balay ij[5] = 6 * i + 5; 33949566063dSJacob 
Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33959566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33967b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33979566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3398bbead8a2SBarry Smith diag += 36; 3399bbead8a2SBarry Smith } 3400bbead8a2SBarry Smith break; 3401bbead8a2SBarry Smith case 7: 3402bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 34039371c9d4SSatish Balay ij[0] = 7 * i; 34049371c9d4SSatish Balay ij[1] = 7 * i + 1; 34059371c9d4SSatish Balay ij[2] = 7 * i + 2; 34069371c9d4SSatish Balay ij[3] = 7 * i + 3; 34079371c9d4SSatish Balay ij[4] = 7 * i + 4; 34089371c9d4SSatish Balay ij[5] = 7 * i + 5; 3409cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 34109566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 34119566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 34127b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34139566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3414bbead8a2SBarry Smith diag += 49; 3415bbead8a2SBarry Smith } 3416bbead8a2SBarry Smith break; 3417bbead8a2SBarry Smith default: 34189566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3419bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3420ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34219566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34229566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 34237b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34249566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3425bbead8a2SBarry Smith diag += bs2; 3426bbead8a2SBarry Smith } 34279566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3428bbead8a2SBarry Smith } 3429bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 34303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3431bbead8a2SBarry Smith } 3432bbead8a2SBarry Smith 3433d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3434d71ae5a4SJacob Faibussowitsch { 343573a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3436fff043a9SJunchao Zhang PetscScalar a, *aa; 343773a71a0fSBarry Smith PetscInt m, n, i, j, col; 343873a71a0fSBarry Smith 343973a71a0fSBarry Smith PetscFunctionBegin; 344073a71a0fSBarry Smith if (!x->assembled) { 34419566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 344273a71a0fSBarry Smith for (i = 0; i < m; i++) { 344373a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34449566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 344573a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34469566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 344773a71a0fSBarry Smith } 344873a71a0fSBarry Smith } 3449e2ce353bSJunchao Zhang } else { 34509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34519566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3453e2ce353bSJunchao Zhang } 34549566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34559566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 345773a71a0fSBarry Smith } 345873a71a0fSBarry Smith 3459679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on 
columns in range of [low, high) */ 3460d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3461d71ae5a4SJacob Faibussowitsch { 3462679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3463679944adSJunchao Zhang PetscScalar a; 3464679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3465679944adSJunchao Zhang 3466679944adSJunchao Zhang PetscFunctionBegin; 3467679944adSJunchao Zhang nskip = high - low; 34689566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3469679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3470679944adSJunchao Zhang for (i = 0; i < m; i++) { 3471679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34729566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3473679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3474679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34759566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3476679944adSJunchao Zhang } 3477e2ce353bSJunchao Zhang } 34789566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34799566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3481679944adSJunchao Zhang } 3482679944adSJunchao Zhang 34830a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3484cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3485cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3486cb5b572fSBarry Smith MatMult_SeqAIJ, 348797304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34887c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34897c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3490f4259b30SLisandro Dalcin NULL, 3491f4259b30SLisandro Dalcin NULL, 3492f4259b30SLisandro Dalcin NULL, 3493f4259b30SLisandro Dalcin /* 10*/ 
NULL, 3494cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3495f4259b30SLisandro Dalcin NULL, 349641f059aeSBarry Smith MatSOR_SeqAIJ, 349791e9d3e2SHong Zhang MatTranspose_SeqAIJ, 349897304618SKris Buschelman /* 15*/ MatGetInfo_SeqAIJ, 3499cb5b572fSBarry Smith MatEqual_SeqAIJ, 3500cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3501cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3502cb5b572fSBarry Smith MatNorm_SeqAIJ, 3503f4259b30SLisandro Dalcin /* 20*/ NULL, 3504cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3505cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3506cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3507d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3508f4259b30SLisandro Dalcin NULL, 3509f4259b30SLisandro Dalcin NULL, 3510f4259b30SLisandro Dalcin NULL, 3511f4259b30SLisandro Dalcin NULL, 351226cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 3513f4259b30SLisandro Dalcin NULL, 3514f4259b30SLisandro Dalcin NULL, 3515f4259b30SLisandro Dalcin NULL, 3516f4259b30SLisandro Dalcin NULL, 3517d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3518f4259b30SLisandro Dalcin NULL, 3519f4259b30SLisandro Dalcin NULL, 3520cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3521f4259b30SLisandro Dalcin NULL, 3522d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35237dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3524cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3525cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3526cb5b572fSBarry Smith MatCopy_SeqAIJ, 3527d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3528cb5b572fSBarry Smith MatScale_SeqAIJ, 35297d68702bSBarry Smith MatShift_SeqAIJ, 353079299369SBarry Smith MatDiagonalSet_SeqAIJ, 35316e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 353273a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35333b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35343b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35353b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3536a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 353793dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 
3538f4259b30SLisandro Dalcin NULL, 3539f4259b30SLisandro Dalcin NULL, 3540cda55fadSBarry Smith MatPermute_SeqAIJ, 3541f4259b30SLisandro Dalcin NULL, 3542f4259b30SLisandro Dalcin /* 59*/ NULL, 3543b9b97703SBarry Smith MatDestroy_SeqAIJ, 3544b9b97703SBarry Smith MatView_SeqAIJ, 3545f4259b30SLisandro Dalcin NULL, 3546f4259b30SLisandro Dalcin NULL, 3547*8bb0f5c6SPierre Jolivet /* 64*/ MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin NULL, 3550f4259b30SLisandro Dalcin NULL, 3551*8bb0f5c6SPierre Jolivet MatGetRowMaxAbs_SeqAIJ, 3552*8bb0f5c6SPierre Jolivet /* 69*/ MatGetRowMinAbs_SeqAIJ, 3553f4259b30SLisandro Dalcin NULL, 3554f4259b30SLisandro Dalcin NULL, 35553acb8795SBarry Smith MatFDColoringApply_AIJ, 3556f4259b30SLisandro Dalcin NULL, 3557*8bb0f5c6SPierre Jolivet /* 74*/ MatFindZeroDiagonals_SeqAIJ, 3558f4259b30SLisandro Dalcin NULL, 3559f4259b30SLisandro Dalcin NULL, 3560f4259b30SLisandro Dalcin NULL, 3561bc011b1eSHong Zhang MatLoad_SeqAIJ, 3562*8bb0f5c6SPierre Jolivet /* 79*/ NULL, 3563*8bb0f5c6SPierre Jolivet NULL, 3564*8bb0f5c6SPierre Jolivet NULL, 3565*8bb0f5c6SPierre Jolivet NULL, 3566*8bb0f5c6SPierre Jolivet NULL, 35676cff0a6bSPierre Jolivet /* 84*/ NULL, 356826be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3569*8bb0f5c6SPierre Jolivet MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3570f4259b30SLisandro Dalcin NULL, 35716fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3572*8bb0f5c6SPierre Jolivet /* 90*/ NULL, 3573*8bb0f5c6SPierre Jolivet MatProductSetFromOptions_SeqAIJ, 3574f4259b30SLisandro Dalcin NULL, 3575f4259b30SLisandro Dalcin NULL, 357687d4246cSBarry Smith MatConjugate_SeqAIJ, 3577*8bb0f5c6SPierre Jolivet /* 94*/ NULL, 3578*8bb0f5c6SPierre Jolivet MatSetValuesRow_SeqAIJ, 357999cafbc1SBarry Smith MatRealPart_SeqAIJ, 3580f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3581f4259b30SLisandro Dalcin NULL, 3582*8bb0f5c6SPierre Jolivet /* 99*/ NULL, 3583*8bb0f5c6SPierre Jolivet 
MatMatSolve_SeqAIJ, 3584f4259b30SLisandro Dalcin NULL, 35852af78befSBarry Smith MatGetRowMin_SeqAIJ, 3586f4259b30SLisandro Dalcin NULL, 3587*8bb0f5c6SPierre Jolivet /*104*/ MatMissingDiagonal_SeqAIJ, 3588f4259b30SLisandro Dalcin NULL, 3589f4259b30SLisandro Dalcin NULL, 3590f4259b30SLisandro Dalcin NULL, 3591f4259b30SLisandro Dalcin NULL, 3592*8bb0f5c6SPierre Jolivet /*109*/ NULL, 3593f4259b30SLisandro Dalcin NULL, 3594f4259b30SLisandro Dalcin NULL, 3595f4259b30SLisandro Dalcin NULL, 3596*8bb0f5c6SPierre Jolivet NULL, 3597*8bb0f5c6SPierre Jolivet /*114*/ MatGetMultiProcBlock_SeqAIJ, 3598*8bb0f5c6SPierre Jolivet MatFindNonzeroRows_SeqAIJ, 3599a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 360037868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 36010da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3602*8bb0f5c6SPierre Jolivet /*119*/ NULL, 3603f4259b30SLisandro Dalcin NULL, 3604f4259b30SLisandro Dalcin NULL, 360575648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3606b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3607*8bb0f5c6SPierre Jolivet /*124*/ MatTransColoringApplySpToDen_SeqAIJ, 36082b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 36093964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3610*8bb0f5c6SPierre Jolivet NULL, 3611*8bb0f5c6SPierre Jolivet NULL, 3612*8bb0f5c6SPierre Jolivet /*129*/ MatFDColoringSetUp_SeqXAIJ, 3613*8bb0f5c6SPierre Jolivet MatFindOffBlockDiagonalEntries_SeqAIJ, 3614*8bb0f5c6SPierre Jolivet MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 3615*8bb0f5c6SPierre Jolivet MatDestroySubMatrices_SeqAIJ, 3616*8bb0f5c6SPierre Jolivet NULL, 3617*8bb0f5c6SPierre Jolivet /*134*/ NULL, 3618*8bb0f5c6SPierre Jolivet MatCreateGraph_Simple_AIJ, 3619*8bb0f5c6SPierre Jolivet MatTransposeSymbolic_SeqAIJ, 3620*8bb0f5c6SPierre Jolivet MatEliminateZeros_SeqAIJ, 3621*8bb0f5c6SPierre Jolivet MatGetRowSumAbs_SeqAIJ, 3622f4259b30SLisandro Dalcin /*139*/ NULL, 3623f4259b30SLisandro Dalcin NULL, 3624f4259b30SLisandro Dalcin NULL, 
3625fe1fc275SAlexander MatCopyHashToXAIJ_Seq_Hash}; 362617ab2063SBarry Smith 3627ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3628d71ae5a4SJacob Faibussowitsch { 3629bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 363097f1f81fSBarry Smith PetscInt i, nz, n; 3631bef8e0ddSBarry Smith 3632bef8e0ddSBarry Smith PetscFunctionBegin; 3633bef8e0ddSBarry Smith nz = aij->maxnz; 3634d0f46423SBarry Smith n = mat->rmap->n; 3635ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3636bef8e0ddSBarry Smith aij->nz = nz; 3637ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 36383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3639bef8e0ddSBarry Smith } 3640bef8e0ddSBarry Smith 3641a3bb6f32SFande Kong /* 3642ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 3643ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3644ddea5d60SJunchao Zhang */ 3645d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3646d71ae5a4SJacob Faibussowitsch { 3647a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3648eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3649eec179cfSJacob Faibussowitsch PetscHashIter tpos; 365025b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 365125b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3652a3bb6f32SFande Kong 3653a3bb6f32SFande Kong PetscFunctionBegin; 3654a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 36554f572ea9SToby Isaac PetscAssertPointer(mapping, 2); 3656a3bb6f32SFande Kong /* use a table */ 3657eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3658a3bb6f32SFande Kong ec = 0; 365925b670f0SStefano Zampini 
for (i = 0; i < nz; i++) { 366025b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3661eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3662a3bb6f32SFande Kong if (!data) { 3663a3bb6f32SFande Kong /* one based table */ 3664c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3665a3bb6f32SFande Kong } 3666a3bb6f32SFande Kong } 3667a3bb6f32SFande Kong /* form array of columns we need */ 36689566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3669eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3670eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3671eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3672eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3673eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3674a3bb6f32SFande Kong gid--; 3675a3bb6f32SFande Kong lid--; 3676a3bb6f32SFande Kong garray[lid] = gid; 3677a3bb6f32SFande Kong } 36789566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3679eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3680c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3681a3bb6f32SFande Kong /* compact out the extra columns in B */ 368225b670f0SStefano Zampini for (i = 0; i < nz; i++) { 368325b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3684eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3685a3bb6f32SFande Kong lid--; 368625b670f0SStefano Zampini jj[i] = lid; 3687a3bb6f32SFande Kong } 36889566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3689eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 36909566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 
36919566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36929566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 36933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3694a3bb6f32SFande Kong } 3695a3bb6f32SFande Kong 3696bef8e0ddSBarry Smith /*@ 3697bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3698bef8e0ddSBarry Smith in the matrix. 3699bef8e0ddSBarry Smith 3700bef8e0ddSBarry Smith Input Parameters: 370111a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3702bef8e0ddSBarry Smith - indices - the column indices 3703bef8e0ddSBarry Smith 370415091d37SBarry Smith Level: advanced 370515091d37SBarry Smith 3706bef8e0ddSBarry Smith Notes: 3707bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3708bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 370911a5261eSBarry Smith of the `MatSetValues()` operation. 3710bef8e0ddSBarry Smith 3711bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 371211a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3713bef8e0ddSBarry Smith 371411a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3715bef8e0ddSBarry Smith 3716b9617806SBarry Smith The indices should start with zero, not one. 
3717b9617806SBarry Smith 37181cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ` 3719bef8e0ddSBarry Smith @*/ 3720d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3721d71ae5a4SJacob Faibussowitsch { 3722bef8e0ddSBarry Smith PetscFunctionBegin; 37230700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 37244f572ea9SToby Isaac PetscAssertPointer(indices, 2); 3725cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 37263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3727bef8e0ddSBarry Smith } 3728bef8e0ddSBarry Smith 3729ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3730d71ae5a4SJacob Faibussowitsch { 3731be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3732d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3733be6bf707SBarry Smith 3734be6bf707SBarry Smith PetscFunctionBegin; 373528b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3736be6bf707SBarry Smith 3737be6bf707SBarry Smith /* allocate space for values if not already there */ 37384dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3739be6bf707SBarry Smith 3740be6bf707SBarry Smith /* copy values over */ 37419566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 37423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3743be6bf707SBarry Smith } 3744be6bf707SBarry Smith 3745be6bf707SBarry Smith /*@ 374620f4b53cSBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the 3747be6bf707SBarry Smith nonlinear portion. 
3748be6bf707SBarry Smith 3749c3339decSBarry Smith Logically Collect 3750be6bf707SBarry Smith 375127430b45SBarry Smith Input Parameter: 375211a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3753be6bf707SBarry Smith 375415091d37SBarry Smith Level: advanced 375515091d37SBarry Smith 37562920cce0SJacob Faibussowitsch Example Usage: 375727430b45SBarry Smith .vb 37582ef1f0ffSBarry Smith Using SNES 375927430b45SBarry Smith Create Jacobian matrix 376027430b45SBarry Smith Set linear terms into matrix 376127430b45SBarry Smith Apply boundary conditions to matrix, at this time matrix must have 376227430b45SBarry Smith final nonzero structure (i.e. setting the nonlinear terms and applying 376327430b45SBarry Smith boundary conditions again will not change the nonzero structure 376427430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 376527430b45SBarry Smith MatStoreValues(mat); 376627430b45SBarry Smith Call SNESSetJacobian() with matrix 376727430b45SBarry Smith In your Jacobian routine 376827430b45SBarry Smith MatRetrieveValues(mat); 376927430b45SBarry Smith Set nonlinear terms in matrix 3770be6bf707SBarry Smith 377127430b45SBarry Smith Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself: 377227430b45SBarry Smith // build linear portion of Jacobian 377327430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 377427430b45SBarry Smith MatStoreValues(mat); 377527430b45SBarry Smith loop over nonlinear iterations 377627430b45SBarry Smith MatRetrieveValues(mat); 377727430b45SBarry Smith // call MatSetValues(mat,...) 
to set nonliner portion of Jacobian 377827430b45SBarry Smith // call MatAssemblyBegin/End() on matrix 377927430b45SBarry Smith Solve linear system with Jacobian 378027430b45SBarry Smith endloop 378127430b45SBarry Smith .ve 3782be6bf707SBarry Smith 3783be6bf707SBarry Smith Notes: 3784da81f932SPierre Jolivet Matrix must already be assembled before calling this routine 378511a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3786be6bf707SBarry Smith calling this routine. 3787be6bf707SBarry Smith 37880c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37890c468ba9SBarry Smith and does not allocated additional space. 37900c468ba9SBarry Smith 3791fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()` 3792be6bf707SBarry Smith @*/ 3793d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3794d71ae5a4SJacob Faibussowitsch { 3795be6bf707SBarry Smith PetscFunctionBegin; 37960700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 379728b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 379828b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3799cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 38003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3801be6bf707SBarry Smith } 3802be6bf707SBarry Smith 3803ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3804d71ae5a4SJacob Faibussowitsch { 3805be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3806d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3807be6bf707SBarry Smith 3808be6bf707SBarry Smith PetscFunctionBegin; 380928b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must 
call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 381028b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3811be6bf707SBarry Smith /* copy values over */ 38129566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 38133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3814be6bf707SBarry Smith } 3815be6bf707SBarry Smith 3816be6bf707SBarry Smith /*@ 381720f4b53cSBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()` 3818be6bf707SBarry Smith 3819c3339decSBarry Smith Logically Collect 3820be6bf707SBarry Smith 38212fe279fdSBarry Smith Input Parameter: 382211a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3823be6bf707SBarry Smith 382415091d37SBarry Smith Level: advanced 382515091d37SBarry Smith 38261cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()` 3827be6bf707SBarry Smith @*/ 3828d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3829d71ae5a4SJacob Faibussowitsch { 3830be6bf707SBarry Smith PetscFunctionBegin; 38310700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 383228b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 383328b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3834cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 38353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3836be6bf707SBarry Smith } 3837be6bf707SBarry Smith 38385d83a8b1SBarry Smith /*@ 383911a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 38400d15e28bSLois Curfman McInnes (the default parallel PETSc format). 
For good matrix assembly performance
  the user should preallocate the matrix storage by setting the parameter `nz`
  (or the array `nnz`).

  Collective

  Input Parameters:
+ comm - MPI communicator, set to `PETSC_COMM_SELF`
. m    - number of rows
. n    - number of columns
. nz   - number of nonzeros per row (same for all rows)
- nnz  - array containing the number of nonzeros in the various rows
         (possibly different for each row) or NULL

  Output Parameter:
. A - the matrix

  Options Database Keys:
+ -mat_no_inode            - Do not use inodes
- -mat_inode_limit <limit> - Sets inode limit (max limit=5)

  Level: intermediate

  Notes:
  It is recommended to use `MatCreateFromOptions()` instead of this routine

  If `nnz` is given then `nz` is ignored

  The `MATSEQAIJ` format, also called
  compressed row storage, is fully compatible with standard Fortran
  storage.  That is, the stored row and column indices can begin at
  either one (as in Fortran) or zero.

  Specify the preallocated storage with either `nz` or `nnz` (not both).
  Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
  allocation.

  By default, this format uses inodes (identical nodes) when possible, to
  improve numerical efficiency of matrix-vector products and solves. We
  search for consecutive rows with the same nonzero structure, thereby
  reusing matrix information to achieve increased efficiency.

.seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
@*/
PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
{
  PetscFunctionBegin;
  /* create the object, fix its sizes (local sizes equal the global ones) and its type ... */
  PetscCall(MatCreate(comm, A));
  PetscCall(MatSetSizes(*A, m, n, m, n));
  PetscCall(MatSetType(*A, MATSEQAIJ));
  /* ... then preallocate by calling the SeqAIJ implementation directly */
  PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*@
  MatSeqAIJSetPreallocation - For good matrix assembly performance
  the user should preallocate the matrix storage by setting the parameter `nz`
  (or the array `nnz`).  By setting these parameters accurately, performance
  during matrix assembly can be increased by more than a factor of 50.

  Collective

  Input Parameters:
+ B   - The matrix
. nz  - number of nonzeros per row (same for all rows)
- nnz - array containing the number of nonzeros in the various rows
         (possibly different for each row) or NULL

  Options Database Keys:
+ -mat_no_inode            - Do not use inodes
- -mat_inode_limit <limit> - Sets inode limit (max limit=5)

  Level: intermediate

  Notes:
  If `nnz` is given then `nz` is ignored

  The `MATSEQAIJ` format, also called
  compressed row storage, is fully compatible with standard Fortran
  storage.  That is, the stored row and column indices can begin at
  either one (as in Fortran) or zero.  See the users' manual for details.

  Specify the preallocated storage with either `nz` or `nnz` (not both).
  Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
  allocation.

  You can call `MatGetInfo()` to get information on how effective the preallocation was;
  for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
  You can also run with the option -info and look for messages with the string
  malloc in them to see if additional memory allocation was needed.
3930aa95bbe8SBarry Smith 393111a5261eSBarry Smith Developer Notes: 393211a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3933a96a251dSBarry Smith entries or columns indices 3934a96a251dSBarry Smith 3935273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3936273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3937273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3938273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3939273d9f13SBarry Smith 39401cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3941db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3942273d9f13SBarry Smith @*/ 3943d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3944d71ae5a4SJacob Faibussowitsch { 3945a23d5eceSKris Buschelman PetscFunctionBegin; 39466ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39476ba663aaSJed Brown PetscValidType(B, 1); 3948cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 39493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3950a23d5eceSKris Buschelman } 3951a23d5eceSKris Buschelman 3952d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3953d71ae5a4SJacob Faibussowitsch { 3954ad79cf63SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 39552576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE; 395697f1f81fSBarry Smith PetscInt i; 3957273d9f13SBarry Smith 3958273d9f13SBarry Smith PetscFunctionBegin; 3959ad79cf63SBarry Smith if (B->hash_active) { 3960aea10558SJacob Faibussowitsch B->ops[0] = 
b->cops; 3961ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3962ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3963ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3964ad79cf63SBarry Smith } 39652576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3966a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3967c461c341SBarry Smith skipallocation = PETSC_TRUE; 3968c461c341SBarry Smith nz = 0; 3969c461c341SBarry Smith } 39709566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39719566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3972899cda47SBarry Smith 3973435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 397408401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 39759f0612e4SBarry Smith if (nnz) { 3976d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 397708401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 397808401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3979b73539f3SBarry Smith } 3980b73539f3SBarry Smith } 3981b73539f3SBarry Smith 3982273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3983ab93d7beSBarry Smith if (!skipallocation) { 39844dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3985071fcb05SBarry Smith if (!b->ilen) { 3986071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39879566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3988071fcb05SBarry Smith } else { 39899566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39902ee49352SLisandro Dalcin } 3991aa624791SPierre Jolivet if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); 3992273d9f13SBarry Smith if (!nnz) { 3993435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3994c62bd62aSJed Brown else if (nz < 0) nz = 1; 39955d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3996d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 3997c43c4a61SBarry Smith PetscCall(PetscIntMultError(nz, B->rmap->n, &nz)); 3998273d9f13SBarry Smith } else { 3999c73702f5SBarry Smith PetscInt64 nz64 = 0; 40009371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 40019371c9d4SSatish Balay b->imax[i] = nnz[i]; 40029371c9d4SSatish Balay nz64 += nnz[i]; 40039371c9d4SSatish Balay } 40049566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 4005273d9f13SBarry Smith } 4006ab93d7beSBarry Smith 4007273d9f13SBarry Smith /* allocate the matrix space */ 40089566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 40099f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscInt), (void **)&b->j)); 40109f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(B->rmap->n + 1, sizeof(PetscInt), (void **)&b->i)); 40119f0612e4SBarry Smith b->free_ij = PETSC_TRUE; 4012396832f4SHong Zhang if (B->structure_only) { 40139f0612e4SBarry Smith b->free_a = PETSC_FALSE; 4014396832f4SHong Zhang } else { 40159f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscScalar), (void **)&b->a)); 40169f0612e4SBarry Smith b->free_a = PETSC_TRUE; 4017396832f4SHong Zhang } 4018bfeeae90SHong Zhang b->i[0] = 0; 4019ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4020c461c341SBarry Smith } else { 
4021e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4022e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4023c461c341SBarry Smith } 4024273d9f13SBarry Smith 4025846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4026846b4da1SFande Kong /* reserve user-requested sparsity */ 40279566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4028846b4da1SFande Kong } 4029846b4da1SFande Kong 4030273d9f13SBarry Smith b->nz = 0; 4031273d9f13SBarry Smith b->maxnz = nz; 4032273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40331baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4034cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4035cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40365519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40375519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 40385519a089SJose E. Roman */ 40395519a089SJose E. Roman B->nonzerostate++; 40403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4041273d9f13SBarry Smith } 4042273d9f13SBarry Smith 40434c51d546SAlexander PetscErrorCode MatResetPreallocation_SeqAIJ_Private(Mat A, PetscBool *memoryreset) 4044d71ae5a4SJacob Faibussowitsch { 4045846b4da1SFande Kong Mat_SeqAIJ *a; 4046a5bbaf83SFande Kong PetscInt i; 40471f14be2bSBarry Smith PetscBool skipreset; 4048846b4da1SFande Kong 4049846b4da1SFande Kong PetscFunctionBegin; 4050846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 405114d0e64fSAlex Lindsay 40524c51d546SAlexander PetscCheck(A->insertmode == NOT_SET_VALUES, PETSC_COMM_SELF, PETSC_ERR_SUP, "Cannot reset preallocation after setting some values but not yet calling MatAssemblyBegin()/MatAssemblyEnd()"); 40534c51d546SAlexander if (A->num_ass == 0) PetscFunctionReturn(PETSC_SUCCESS); 40544c51d546SAlexander 405514d0e64fSAlex Lindsay /* Check local size. 
If zero, then return */ 40563ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 405714d0e64fSAlex Lindsay 4058846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40592c814fdeSFande Kong /* if no saved info, we error out */ 406028b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40612c814fdeSFande Kong 40621f14be2bSBarry Smith PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and cannot reset preallocation "); 40632c814fdeSFande Kong 40641f14be2bSBarry Smith PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset)); 40654c51d546SAlexander if (skipreset) PetscCall(MatZeroEntries(A)); 40664c51d546SAlexander else { 40679566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40689566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4069846b4da1SFande Kong a->i[0] = 0; 4070ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4071846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4072846b4da1SFande Kong a->nz = 0; 4073846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4074846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4075846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4076846b4da1SFande Kong A->assembled = PETSC_FALSE; 4077b3a35320SAlex Lindsay A->nonzerostate++; 4078b3a35320SAlex Lindsay /* Log that the state of this object has changed; this will help guarantee that preconditioners get re-setup */ 4079b3a35320SAlex Lindsay PetscCall(PetscObjectStateIncrease((PetscObject)A)); 40801f14be2bSBarry Smith } 40814c51d546SAlexander if (memoryreset) *memoryreset = (PetscBool)!skipreset; 40824c51d546SAlexander PetscFunctionReturn(PETSC_SUCCESS); 40834c51d546SAlexander } 40844c51d546SAlexander 40854c51d546SAlexander static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 40864c51d546SAlexander { 
40874c51d546SAlexander PetscFunctionBegin; 40884c51d546SAlexander PetscCall(MatResetPreallocation_SeqAIJ_Private(A, NULL)); 40893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4090846b4da1SFande Kong } 4091846b4da1SFande Kong 409258d36128SBarry Smith /*@ 409311a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4094a1661176SMatthew Knepley 4095a1661176SMatthew Knepley Input Parameters: 4096a1661176SMatthew Knepley + B - the matrix 4097d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero) 4098d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row 4099d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided 4100a1661176SMatthew Knepley 4101a1661176SMatthew Knepley Level: developer 4102a1661176SMatthew Knepley 41036a9b8d82SBarry Smith Notes: 41042ef1f0ffSBarry Smith The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 410558d36128SBarry Smith 41066a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 41076a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 41086a9b8d82SBarry Smith 41096a9b8d82SBarry Smith Developer Notes: 41102ef1f0ffSBarry Smith An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and 41112ef1f0ffSBarry Smith then just copies the `v` values directly with `PetscMemcpy()`. 41126a9b8d82SBarry Smith 411311a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
41146a9b8d82SBarry Smith 4115fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()` 4116a1661176SMatthew Knepley @*/ 4117d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4118d71ae5a4SJacob Faibussowitsch { 4119a1661176SMatthew Knepley PetscFunctionBegin; 41200700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41216ba663aaSJed Brown PetscValidType(B, 1); 4122cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 41233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4124a1661176SMatthew Knepley } 4125a1661176SMatthew Knepley 4126ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4127d71ae5a4SJacob Faibussowitsch { 4128a1661176SMatthew Knepley PetscInt i; 4129a1661176SMatthew Knepley PetscInt m, n; 4130a1661176SMatthew Knepley PetscInt nz; 41316a9b8d82SBarry Smith PetscInt *nnz; 4132a1661176SMatthew Knepley 4133a1661176SMatthew Knepley PetscFunctionBegin; 4134aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4135779a8d59SSatish Balay 41369566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4138779a8d59SSatish Balay 41399566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4141a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4142b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 414308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, 
"Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4144a1661176SMatthew Knepley nnz[i] = nz; 4145a1661176SMatthew Knepley } 41469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41479566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4148a1661176SMatthew Knepley 41498e3a54c0SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES)); 4150a1661176SMatthew Knepley 41519566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41529566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4153a1661176SMatthew Knepley 41549566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 41553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4156a1661176SMatthew Knepley } 4157a1661176SMatthew Knepley 4158ad7e164aSPierre Jolivet /*@ 41592ef1f0ffSBarry Smith MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`. 4160ad7e164aSPierre Jolivet 4161ad7e164aSPierre Jolivet Input Parameters: 4162ad7e164aSPierre Jolivet + A - left-hand side matrix 4163ad7e164aSPierre Jolivet . B - right-hand side matrix 416411a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4165ad7e164aSPierre Jolivet 4166ad7e164aSPierre Jolivet Output Parameter: 41672ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B` 4168ad7e164aSPierre Jolivet 4169ad7e164aSPierre Jolivet Level: intermediate 4170ad7e164aSPierre Jolivet 417111a5261eSBarry Smith Note: 417211a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4173ad7e164aSPierre Jolivet 41741cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4175ad7e164aSPierre Jolivet @*/ 4176d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4177d71ae5a4SJacob Faibussowitsch { 4178ad7e164aSPierre Jolivet PetscFunctionBegin; 4179ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4180ad7e164aSPierre Jolivet PetscValidType(A, 1); 4181ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4182ad7e164aSPierre Jolivet PetscValidType(B, 2); 41834f572ea9SToby Isaac PetscAssertPointer(C, 4); 4184ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4185ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4186ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4187ad7e164aSPierre Jolivet } 4188cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 41893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4190ad7e164aSPierre Jolivet } 4191ad7e164aSPierre Jolivet 4192ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4193d71ae5a4SJacob Faibussowitsch { 4194ad7e164aSPierre Jolivet Mat newmat; 4195ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4196ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4197ad7e164aSPierre Jolivet PetscScalar *v; 4198fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4199ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4200ad7e164aSPierre Jolivet PetscBool flg; 4201ad7e164aSPierre Jolivet 4202ad7e164aSPierre Jolivet PetscFunctionBegin; 420328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 420428b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 420528b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 420628b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 42079566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 420828b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4209aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4210ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42119566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 42129566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 42139566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 42149566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4215ad7e164aSPierre Jolivet i[0] = 0; 4216ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4217ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4218ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4219ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4220ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4221ad7e164aSPierre Jolivet } 4222ad7e164aSPierre Jolivet } 4223ad7e164aSPierre Jolivet } 42249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4225ad7e164aSPierre Jolivet *C = newmat; 42269566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4227ad7e164aSPierre Jolivet nnz = 0; 4228ad7e164aSPierre Jolivet } 42299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 
42309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4232ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4233ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4234ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4235ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4236ad7e164aSPierre Jolivet } 4237ad7e164aSPierre Jolivet } 4238ad7e164aSPierre Jolivet } 42399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 42423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4243ad7e164aSPierre Jolivet } 4244ad7e164aSPierre Jolivet 4245c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4246af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4247170fe5c8SBarry Smith 4248170fe5c8SBarry Smith /* 4249170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4250170fe5c8SBarry Smith 4251170fe5c8SBarry Smith n p p 42522da392ccSBarry Smith [ ] [ ] [ ] 42532da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42542da392ccSBarry Smith [ ] [ ] [ ] 4255170fe5c8SBarry Smith 4256170fe5c8SBarry Smith */ 4257d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4258d71ae5a4SJacob Faibussowitsch { 4259170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4260170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4261170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 426286214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4263170fe5c8SBarry Smith const PetscInt *ii, *idx; 4264170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4265170fe5c8SBarry Smith PetscScalar *c, *c_q; 426686214ceeSStefano Zampini PetscInt clda 
= sub_c->lda; 426786214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4268170fe5c8SBarry Smith 4269170fe5c8SBarry Smith PetscFunctionBegin; 4270d0f46423SBarry Smith m = A->rmap->n; 4271d0f46423SBarry Smith n = A->cmap->n; 4272d0f46423SBarry Smith p = B->cmap->n; 4273170fe5c8SBarry Smith a = sub_a->v; 4274170fe5c8SBarry Smith b = sub_b->a; 4275170fe5c8SBarry Smith c = sub_c->v; 427686214ceeSStefano Zampini if (clda == m) { 42779566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 427886214ceeSStefano Zampini } else { 427986214ceeSStefano Zampini for (j = 0; j < p; j++) 42809371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 428186214ceeSStefano Zampini } 4282170fe5c8SBarry Smith ii = sub_b->i; 4283170fe5c8SBarry Smith idx = sub_b->j; 4284170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4285170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4286170fe5c8SBarry Smith while (q-- > 0) { 428786214ceeSStefano Zampini c_q = c + clda * (*idx); 428886214ceeSStefano Zampini a_q = a + alda * i; 4289854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4290170fe5c8SBarry Smith idx++; 4291170fe5c8SBarry Smith b++; 4292170fe5c8SBarry Smith } 4293170fe5c8SBarry Smith } 42943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4295170fe5c8SBarry Smith } 4296170fe5c8SBarry Smith 4297d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4298d71ae5a4SJacob Faibussowitsch { 4299d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 430086214ceeSStefano Zampini PetscBool cisdense; 4301170fe5c8SBarry Smith 4302170fe5c8SBarry Smith PetscFunctionBegin; 430308401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 43049566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 43059566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 
4306d5e393b6SSuyash Tandon PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 430748a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 43089566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4309d73949e8SHong Zhang 43104222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 43113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4312170fe5c8SBarry Smith } 4313170fe5c8SBarry Smith 43140bad9183SKris Buschelman /*MC 4315fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43160bad9183SKris Buschelman based on compressed sparse row format. 43170bad9183SKris Buschelman 43182ef1f0ffSBarry Smith Options Database Key: 43190bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43200bad9183SKris Buschelman 43210bad9183SKris Buschelman Level: beginner 43220bad9183SKris Buschelman 43230cd7f59aSBarry Smith Notes: 43242ef1f0ffSBarry Smith `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values, 43250cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43260cd7f59aSBarry Smith in the matrix 43270cd7f59aSBarry Smith 432811a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this no 432911a5261eSBarry Smith space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored 43300cd7f59aSBarry Smith 433111a5261eSBarry Smith Developer Note: 43322ef1f0ffSBarry Smith It would be nice if all matrix formats supported passing `NULL` in for the numerical values 43330cd7f59aSBarry Smith 43341cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 43350bad9183SKris Buschelman M*/ 43360bad9183SKris Buschelman 4337ccd284c7SBarry Smith /*MC 4338ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 4339ccd284c7SBarry Smith 434011a5261eSBarry Smith This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator, 434111a5261eSBarry Smith and `MATMPIAIJ` otherwise. As a result, for single process communicators, 434211a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4343ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4344ccd284c7SBarry Smith the above preallocation routines for simplicity. 4345ccd284c7SBarry Smith 43462ef1f0ffSBarry Smith Options Database Key: 434711a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()` 4348ccd284c7SBarry Smith 43492ef1f0ffSBarry Smith Level: beginner 43502ef1f0ffSBarry Smith 435111a5261eSBarry Smith Note: 435211a5261eSBarry Smith Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when 4353ccd284c7SBarry Smith enough exist. 
4354ccd284c7SBarry Smith 43551cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4356ccd284c7SBarry Smith M*/ 4357ccd284c7SBarry Smith 4358ccd284c7SBarry Smith /*MC 4359ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4360ccd284c7SBarry Smith 43612ef1f0ffSBarry Smith Options Database Key: 43622ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 43632ef1f0ffSBarry Smith 43642ef1f0ffSBarry Smith Level: beginner 43652ef1f0ffSBarry Smith 43662ef1f0ffSBarry Smith Note: 436711a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 436811a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 436911a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4370ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4371ccd284c7SBarry Smith the above preallocation routines for simplicity. 4372ccd284c7SBarry Smith 43731cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4374ccd284c7SBarry Smith M*/ 4375ccd284c7SBarry Smith 43767906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43777906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43787906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43797906f579SHong Zhang #endif 4380d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4381d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4382d24d4204SJose E. 
Roman #endif 43837906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43847906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43857906f579SHong Zhang #endif 43867906f579SHong Zhang 4387d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4388c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43894222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43907906f579SHong Zhang 43918c778c55SBarry Smith /*@C 439211a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43938c778c55SBarry Smith 43948c778c55SBarry Smith Not Collective 43958c778c55SBarry Smith 43968c778c55SBarry Smith Input Parameter: 4397fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 43988c778c55SBarry Smith 43998c778c55SBarry Smith Output Parameter: 44008c778c55SBarry Smith . 
array - pointer to the data 44018c778c55SBarry Smith 44028c778c55SBarry Smith Level: intermediate 44038c778c55SBarry Smith 4404ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()` 44058c778c55SBarry Smith @*/ 44065d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[]) 4407d71ae5a4SJacob Faibussowitsch { 4408d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44098c778c55SBarry Smith 44108c778c55SBarry Smith PetscFunctionBegin; 4411d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44129566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4413d67d9f35SJunchao Zhang } else { 4414d67d9f35SJunchao Zhang *array = aij->a; 4415d67d9f35SJunchao Zhang } 44163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4417d67d9f35SJunchao Zhang } 4418d67d9f35SJunchao Zhang 4419d67d9f35SJunchao Zhang /*@C 442011a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4421d67d9f35SJunchao Zhang 4422d67d9f35SJunchao Zhang Not Collective 4423d67d9f35SJunchao Zhang 4424d67d9f35SJunchao Zhang Input Parameters: 4425fe59aa6dSJacob Faibussowitsch + A - a `MATSEQAIJ` matrix 4426d67d9f35SJunchao Zhang - array - pointer to the data 4427d67d9f35SJunchao Zhang 4428d67d9f35SJunchao Zhang Level: intermediate 4429d67d9f35SJunchao Zhang 4430ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()` 4431d67d9f35SJunchao Zhang @*/ 44325d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[]) 4433d71ae5a4SJacob Faibussowitsch { 4434d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4435d67d9f35SJunchao Zhang 4436d67d9f35SJunchao Zhang PetscFunctionBegin; 4437d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44389566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4439d67d9f35SJunchao Zhang } else { 4440d67d9f35SJunchao Zhang 
*array = NULL; 4441d67d9f35SJunchao Zhang } 44429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44439566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44458c778c55SBarry Smith } 44468c778c55SBarry Smith 444721e72a00SBarry Smith /*@C 444811a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44498f1ea47aSStefano Zampini 44500ab4885dSBarry Smith Not Collective; No Fortran Support 44518f1ea47aSStefano Zampini 44528f1ea47aSStefano Zampini Input Parameter: 4453fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44548f1ea47aSStefano Zampini 44558f1ea47aSStefano Zampini Output Parameter: 44568f1ea47aSStefano Zampini . array - pointer to the data 44578f1ea47aSStefano Zampini 44588f1ea47aSStefano Zampini Level: intermediate 44598f1ea47aSStefano Zampini 44601cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44618f1ea47aSStefano Zampini @*/ 44625d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[]) 4463d71ae5a4SJacob Faibussowitsch { 4464d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44658f1ea47aSStefano Zampini 44668f1ea47aSStefano Zampini PetscFunctionBegin; 4467d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44689566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4469d67d9f35SJunchao Zhang } else { 4470d67d9f35SJunchao Zhang *array = aij->a; 4471d67d9f35SJunchao Zhang } 44723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44738f1ea47aSStefano Zampini } 44748f1ea47aSStefano Zampini 44758f1ea47aSStefano Zampini /*@C 447611a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44778f1ea47aSStefano Zampini 44780ab4885dSBarry Smith Not Collective; No 
Fortran Support 44798f1ea47aSStefano Zampini 44808f1ea47aSStefano Zampini Input Parameter: 4481fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44828f1ea47aSStefano Zampini 44838f1ea47aSStefano Zampini Output Parameter: 44848f1ea47aSStefano Zampini . array - pointer to the data 44858f1ea47aSStefano Zampini 44868f1ea47aSStefano Zampini Level: intermediate 44878f1ea47aSStefano Zampini 44881cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44898f1ea47aSStefano Zampini @*/ 44905d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[]) 4491d71ae5a4SJacob Faibussowitsch { 4492d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44938f1ea47aSStefano Zampini 44948f1ea47aSStefano Zampini PetscFunctionBegin; 4495d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44969566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4497d67d9f35SJunchao Zhang } else { 4498d67d9f35SJunchao Zhang *array = NULL; 4499d67d9f35SJunchao Zhang } 45003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4501d67d9f35SJunchao Zhang } 4502d67d9f35SJunchao Zhang 4503d67d9f35SJunchao Zhang /*@C 450411a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4505d67d9f35SJunchao Zhang 45060ab4885dSBarry Smith Not Collective; No Fortran Support 4507d67d9f35SJunchao Zhang 4508d67d9f35SJunchao Zhang Input Parameter: 4509fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 4510d67d9f35SJunchao Zhang 4511d67d9f35SJunchao Zhang Output Parameter: 4512d67d9f35SJunchao Zhang . 
array - pointer to the data 4513d67d9f35SJunchao Zhang 4514d67d9f35SJunchao Zhang Level: intermediate 4515d67d9f35SJunchao Zhang 45161cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4517d67d9f35SJunchao Zhang @*/ 45185d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[]) 4519d71ae5a4SJacob Faibussowitsch { 4520d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4521d67d9f35SJunchao Zhang 4522d67d9f35SJunchao Zhang PetscFunctionBegin; 4523d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45249566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4525d67d9f35SJunchao Zhang } else { 4526d67d9f35SJunchao Zhang *array = aij->a; 4527d67d9f35SJunchao Zhang } 45289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45299566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 45303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4531d67d9f35SJunchao Zhang } 4532d67d9f35SJunchao Zhang 4533d67d9f35SJunchao Zhang /*@C 4534d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4535d67d9f35SJunchao Zhang 45360ab4885dSBarry Smith Not Collective; No Fortran Support 4537d67d9f35SJunchao Zhang 4538d67d9f35SJunchao Zhang Input Parameter: 4539fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix 4540d67d9f35SJunchao Zhang 4541d67d9f35SJunchao Zhang Output Parameter: 4542d67d9f35SJunchao Zhang . 
array - pointer to the data 4543d67d9f35SJunchao Zhang 4544d67d9f35SJunchao Zhang Level: intermediate 4545d67d9f35SJunchao Zhang 45461cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4547d67d9f35SJunchao Zhang @*/ 45485d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[]) 4549d71ae5a4SJacob Faibussowitsch { 4550d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4551d67d9f35SJunchao Zhang 4552d67d9f35SJunchao Zhang PetscFunctionBegin; 4553d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45549566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4555d67d9f35SJunchao Zhang } else { 4556d67d9f35SJunchao Zhang *array = NULL; 4557d67d9f35SJunchao Zhang } 45583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45598f1ea47aSStefano Zampini } 45608f1ea47aSStefano Zampini 45618f1ea47aSStefano Zampini /*@C 456211a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45637ee59b9bSJunchao Zhang 45640ab4885dSBarry Smith Not Collective; No Fortran Support 45657ee59b9bSJunchao Zhang 45667ee59b9bSJunchao Zhang Input Parameter: 456711a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45687ee59b9bSJunchao Zhang 45697ee59b9bSJunchao Zhang Output Parameters: 45707ee59b9bSJunchao Zhang + i - row map array of the matrix 45717ee59b9bSJunchao Zhang . j - column index array of the matrix 45727ee59b9bSJunchao Zhang . a - data array of the matrix 4573fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays 45747ee59b9bSJunchao Zhang 4575fe59aa6dSJacob Faibussowitsch Level: developer 45762ef1f0ffSBarry Smith 45777ee59b9bSJunchao Zhang Notes: 45782ef1f0ffSBarry Smith Any of the output parameters can be `NULL`, in which case the corresponding value is not returned. 45797ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. 
Otherwise, they are on the host. 45807ee59b9bSJunchao Zhang 45817ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45822ef1f0ffSBarry Smith If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix. 45837ee59b9bSJunchao Zhang 45841cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45857ee59b9bSJunchao Zhang @*/ 45865d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype) 4587d71ae5a4SJacob Faibussowitsch { 45887ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45897ee59b9bSJunchao Zhang 45907ee59b9bSJunchao Zhang PetscFunctionBegin; 45917ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45927ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45937ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45947ee59b9bSJunchao Zhang } else { 45957ee59b9bSJunchao Zhang if (i) *i = aij->i; 45967ee59b9bSJunchao Zhang if (j) *j = aij->j; 45977ee59b9bSJunchao Zhang if (a) *a = aij->a; 45987ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45997ee59b9bSJunchao Zhang } 46003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 46017ee59b9bSJunchao Zhang } 46027ee59b9bSJunchao Zhang 4603cc4c1da9SBarry Smith /*@ 460421e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 460521e72a00SBarry Smith 460621e72a00SBarry Smith Not Collective 460721e72a00SBarry Smith 460821e72a00SBarry Smith Input Parameter: 4609fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 461021e72a00SBarry Smith 461121e72a00SBarry Smith Output Parameter: 461221e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 461321e72a00SBarry Smith 461421e72a00SBarry Smith Level: intermediate 461521e72a00SBarry Smith 4616ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()` 461721e72a00SBarry Smith @*/ 4618d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4619d71ae5a4SJacob Faibussowitsch { 462021e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 462121e72a00SBarry Smith 462221e72a00SBarry Smith PetscFunctionBegin; 462321e72a00SBarry Smith *nz = aij->rmax; 46243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 462521e72a00SBarry Smith } 462621e72a00SBarry Smith 462749abdd8aSBarry Smith static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void **data) 46282c4ab24aSJunchao Zhang { 462949abdd8aSBarry Smith MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)*data; 46304d86920dSPierre Jolivet 46312c4ab24aSJunchao Zhang PetscFunctionBegin; 46322c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->perm)); 46332c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->jmap)); 46342c4ab24aSJunchao Zhang PetscCall(PetscFree(coo)); 46352c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 46362c4ab24aSJunchao Zhang } 46372c4ab24aSJunchao Zhang 4638d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4639d71ae5a4SJacob Faibussowitsch { 4640394ed5ebSJunchao Zhang MPI_Comm comm; 4641394ed5ebSJunchao Zhang PetscInt *i, *j; 46420d88f7f4SJunchao Zhang PetscInt M, N, row, iprev; 4643394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4644394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4645394ed5ebSJunchao Zhang PetscInt *Aj; 4646394ed5ebSJunchao Zhang PetscScalar *Aa; 4647f4f49eeaSPierre Jolivet Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)mat->data; 4648cbc6b225SStefano Zampini MatType 
rtype; 4649394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 46502c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 46510d88f7f4SJunchao Zhang PetscBool isorted; 46529f0612e4SBarry Smith PetscBool hypre; 46539f0612e4SBarry Smith const char *name; 4654394ed5ebSJunchao Zhang 4655394ed5ebSJunchao Zhang PetscFunctionBegin; 46569566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46579566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4658e8729f6fSJunchao Zhang i = coo_i; 4659e8729f6fSJunchao Zhang j = coo_j; 46609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 46610d88f7f4SJunchao Zhang 46620d88f7f4SJunchao Zhang /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */ 46630d88f7f4SJunchao Zhang isorted = PETSC_TRUE; 46640d88f7f4SJunchao Zhang iprev = PETSC_INT_MIN; 46650d88f7f4SJunchao Zhang for (k = 0; k < coo_n; k++) { 4666394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 46670d88f7f4SJunchao Zhang if (isorted) { 46680d88f7f4SJunchao Zhang if (i[k] < iprev) isorted = PETSC_FALSE; 46690d88f7f4SJunchao Zhang else iprev = i[k]; 46700d88f7f4SJunchao Zhang } 4671394ed5ebSJunchao Zhang perm[k] = k; 4672394ed5ebSJunchao Zhang } 4673394ed5ebSJunchao Zhang 46740d88f7f4SJunchao Zhang /* Sort by row if not already */ 46750d88f7f4SJunchao Zhang if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 4676651b1cf9SStefano Zampini 4677651b1cf9SStefano Zampini /* Advance k to the first row with a non-negative index */ 4678651b1cf9SStefano Zampini for (k = 0; k < coo_n; k++) 46799371c9d4SSatish Balay if (i[k] >= 0) break; 4680394ed5ebSJunchao Zhang nneg = k; 46819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. 
jmap[i] originally is the number of repeats for i-th nonzero */ 4682394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 468335cb6cd3SPierre Jolivet jmap++; /* Inc jmap by 1 for convenience */ 4684394ed5ebSJunchao Zhang 46859f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(M + 1, sizeof(PetscInt), (void **)&Ai)); /* CSR of A */ 46869f0612e4SBarry Smith PetscCall(PetscArrayzero(Ai, M + 1)); 46879f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(coo_n - nneg, sizeof(PetscInt), (void **)&Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4688394ed5ebSJunchao Zhang 4689651b1cf9SStefano Zampini PetscCall(PetscObjectGetName((PetscObject)mat, &name)); 4690651b1cf9SStefano Zampini PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre)); 4691651b1cf9SStefano Zampini 4692394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 469335cb6cd3SPierre Jolivet Ai++; /* Inc by 1 for convenience */ 4694394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4695394ed5ebSJunchao Zhang while (k < coo_n) { 46960d88f7f4SJunchao Zhang PetscBool strictly_sorted; // this row is strictly sorted? 
46970d88f7f4SJunchao Zhang PetscInt jprev; 46980d88f7f4SJunchao Zhang 46990d88f7f4SJunchao Zhang /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */ 4700394ed5ebSJunchao Zhang row = i[k]; 47010d88f7f4SJunchao Zhang start = k; 47020d88f7f4SJunchao Zhang jprev = PETSC_INT_MIN; 47030d88f7f4SJunchao Zhang strictly_sorted = PETSC_TRUE; 47040d88f7f4SJunchao Zhang while (k < coo_n && i[k] == row) { 47050d88f7f4SJunchao Zhang if (strictly_sorted) { 47060d88f7f4SJunchao Zhang if (j[k] <= jprev) strictly_sorted = PETSC_FALSE; 47070d88f7f4SJunchao Zhang else jprev = j[k]; 47080d88f7f4SJunchao Zhang } 47090d88f7f4SJunchao Zhang k++; 47100d88f7f4SJunchao Zhang } 4711394ed5ebSJunchao Zhang end = k; 47120d88f7f4SJunchao Zhang 4713651b1cf9SStefano Zampini /* hack for HYPRE: swap min column to diag so that diagonal values will go first */ 4714651b1cf9SStefano Zampini if (hypre) { 47151690c2aeSBarry Smith PetscInt minj = PETSC_INT_MAX; 4716651b1cf9SStefano Zampini PetscBool hasdiag = PETSC_FALSE; 47170d88f7f4SJunchao Zhang 47180d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to swap the first and the diag 47190d88f7f4SJunchao Zhang PetscCount tmp; 47200d88f7f4SJunchao Zhang for (p = start; p < end; p++) { 47210d88f7f4SJunchao Zhang if (j[p] == row && p != start) { 47221c265611SJunchao Zhang j[p] = j[start]; // swap j[], so that the diagonal value will go first (manipulated by perm[]) 47230d88f7f4SJunchao Zhang j[start] = row; 47240d88f7f4SJunchao Zhang tmp = perm[start]; 47251c265611SJunchao Zhang perm[start] = perm[p]; // also swap perm[] so we can save the call to PetscSortIntWithCountArray() below 47260d88f7f4SJunchao Zhang perm[p] = tmp; 47270d88f7f4SJunchao Zhang break; 47280d88f7f4SJunchao Zhang } 47290d88f7f4SJunchao Zhang } 47300d88f7f4SJunchao Zhang } else { 4731651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4732651b1cf9SStefano Zampini hasdiag = (PetscBool)(hasdiag || (j[p] == row)); 4733651b1cf9SStefano 
Zampini minj = PetscMin(minj, j[p]); 4734651b1cf9SStefano Zampini } 47350d88f7f4SJunchao Zhang 4736651b1cf9SStefano Zampini if (hasdiag) { 4737651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4738651b1cf9SStefano Zampini if (j[p] == minj) j[p] = row; 4739651b1cf9SStefano Zampini else if (j[p] == row) j[p] = minj; 4740651b1cf9SStefano Zampini } 4741651b1cf9SStefano Zampini } 4742651b1cf9SStefano Zampini } 47430d88f7f4SJunchao Zhang } 47441c265611SJunchao Zhang // sort by columns in a row. perm[] indicates their original order 47450d88f7f4SJunchao Zhang if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4746651b1cf9SStefano Zampini 47470d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q 47480d88f7f4SJunchao Zhang for (p = start; p < end; p++, q++) { 47490d88f7f4SJunchao Zhang Aj[q] = j[p]; 47500d88f7f4SJunchao Zhang jmap[q] = 1; 47510d88f7f4SJunchao Zhang } 47526497c311SBarry Smith PetscCall(PetscIntCast(end - start, Ai + row)); 47530d88f7f4SJunchao Zhang nnz += Ai[row]; // q is already advanced 47540d88f7f4SJunchao Zhang } else { 4755394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4756394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 4757651b1cf9SStefano Zampini jmap[q] = 1; /* Number of repeats of this nonzero entry */ 4758394ed5ebSJunchao Zhang Ai[row] = 1; 4759394ed5ebSJunchao Zhang nnz++; 4760394ed5ebSJunchao Zhang 4761394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4762394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4763394ed5ebSJunchao Zhang q++; 4764394ed5ebSJunchao Zhang jmap[q] = 1; 4765394ed5ebSJunchao Zhang Aj[q] = j[p]; 4766394ed5ebSJunchao Zhang Ai[row]++; 4767394ed5ebSJunchao Zhang nnz++; 4768394ed5ebSJunchao Zhang } else { 4769394ed5ebSJunchao Zhang jmap[q]++; 4770394ed5ebSJunchao Zhang } 4771394ed5ebSJunchao Zhang } 
4772394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4773394ed5ebSJunchao Zhang } 47740d88f7f4SJunchao Zhang } 47750d88f7f4SJunchao Zhang 4776394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4777394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 47780d88f7f4SJunchao Zhang jmap--; // Back to the beginning of jmap[] 4779394ed5ebSJunchao Zhang jmap[0] = 0; 4780394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 47810d88f7f4SJunchao Zhang 47829f0612e4SBarry Smith if (nnz < coo_n - nneg) { /* Reallocate with actual number of unique nonzeros */ 4783394ed5ebSJunchao Zhang PetscCount *jmap_new; 4784394ed5ebSJunchao Zhang PetscInt *Aj_new; 4785394ed5ebSJunchao Zhang 47869566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 47879566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 47889566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4789394ed5ebSJunchao Zhang jmap = jmap_new; 4790394ed5ebSJunchao Zhang 47919f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscInt), (void **)&Aj_new)); 47929566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 47939f0612e4SBarry Smith PetscCall(PetscShmgetDeallocateArray((void **)&Aj)); 4794394ed5ebSJunchao Zhang Aj = Aj_new; 4795394ed5ebSJunchao Zhang } 4796394ed5ebSJunchao Zhang 4797394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4798394ed5ebSJunchao Zhang PetscCount *perm_new; 4799cbc6b225SStefano Zampini 48009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 48019566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 48029566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4803394ed5ebSJunchao Zhang perm = perm_new; 4804394ed5ebSJunchao Zhang } 4805394ed5ebSJunchao Zhang 48069566063dSJacob 
Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 48079f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscScalar), (void **)&Aa)); 48089f0612e4SBarry Smith PetscCall(PetscArrayzero(Aa, nnz)); 48099566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4810394ed5ebSJunchao Zhang 4811394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 48122c4ab24aSJunchao Zhang 48132c4ab24aSJunchao Zhang // Put the COO struct in a container and then attach that to the matrix 48142c4ab24aSJunchao Zhang PetscCall(PetscMalloc1(1, &coo)); 48156497c311SBarry Smith PetscCall(PetscIntCast(nnz, &coo->nz)); 48162c4ab24aSJunchao Zhang coo->n = coo_n; 48172c4ab24aSJunchao Zhang coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again 48182c4ab24aSJunchao Zhang coo->jmap = jmap; // of length nnz+1 48192c4ab24aSJunchao Zhang coo->perm = perm; 482003e76207SPierre Jolivet PetscCall(PetscObjectContainerCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", coo, MatCOOStructDestroy_SeqAIJ)); 48213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4822394ed5ebSJunchao Zhang } 4823394ed5ebSJunchao Zhang 4824d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4825d71ae5a4SJacob Faibussowitsch { 4826394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4827394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 48282c4ab24aSJunchao Zhang PetscCount *perm, *jmap; 4829394ed5ebSJunchao Zhang PetscScalar *Aa; 48302c4ab24aSJunchao Zhang PetscContainer container; 48312c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 4832394ed5ebSJunchao Zhang 4833394ed5ebSJunchao Zhang PetscFunctionBegin; 48342c4ab24aSJunchao Zhang PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container)); 48352c4ab24aSJunchao Zhang 
PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix"); 48362c4ab24aSJunchao Zhang PetscCall(PetscContainerGetPointer(container, (void **)&coo)); 48372c4ab24aSJunchao Zhang perm = coo->perm; 48382c4ab24aSJunchao Zhang jmap = coo->jmap; 48399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4840394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4841b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4842b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4843b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4844394ed5ebSJunchao Zhang } 48459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 48463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4847394ed5ebSJunchao Zhang } 4848394ed5ebSJunchao Zhang 484934b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48505063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 485102fe1965SBarry Smith #endif 4852d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4853d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *); 4854d5e393b6SSuyash Tandon #endif 48553d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48565063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 48573d0639e7SStefano Zampini #endif 485802fe1965SBarry Smith 4859d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4860d71ae5a4SJacob Faibussowitsch { 4861273d9f13SBarry Smith Mat_SeqAIJ *b; 486238baddfdSBarry Smith PetscMPIInt size; 4863273d9f13SBarry Smith 4864273d9f13SBarry Smith PetscFunctionBegin; 48659566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 486608401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm 
must be of size 1"); 4867273d9f13SBarry Smith 48684dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 48692205254eSKarl Rupp 4870b0a32e0cSBarry Smith B->data = (void *)b; 4871aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 4872071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 48732205254eSKarl Rupp 4874f4259b30SLisandro Dalcin b->row = NULL; 4875f4259b30SLisandro Dalcin b->col = NULL; 4876f4259b30SLisandro Dalcin b->icol = NULL; 4877b810aeb4SBarry Smith b->reallocs = 0; 487836db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4879f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4880416022c9SBarry Smith b->nonew = 0; 4881f4259b30SLisandro Dalcin b->diag = NULL; 4882f4259b30SLisandro Dalcin b->solve_work = NULL; 4883f4259b30SLisandro Dalcin B->spptr = NULL; 4884f4259b30SLisandro Dalcin b->saved_values = NULL; 4885f4259b30SLisandro Dalcin b->idiag = NULL; 4886f4259b30SLisandro Dalcin b->mdiag = NULL; 4887f4259b30SLisandro Dalcin b->ssor_work = NULL; 488871f1c65dSBarry Smith b->omega = 1.0; 488971f1c65dSBarry Smith b->fshift = 0.0; 489071f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4891bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4892a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 489317ab2063SBarry Smith 48949566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4895d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 48969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 48979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4898b3866ffcSBarry Smith #endif 48999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 49009566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 49019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 49029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 49039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 49049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 49059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 49069779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 49079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4908191b95cbSRichard Tran Mills #endif 490934b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 49109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 49119566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 491302fe1965SBarry Smith #endif 4914d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4915d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 4916d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, 
"MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 4917d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ)); 4918d5e393b6SSuyash Tandon #endif 49193d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 49209566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 49213d0639e7SStefano Zampini #endif 49229566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4923af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 49249566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4925af8000cdSHong Zhang #endif 4926d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 49279566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4928d24d4204SJose E. 
Roman #endif 492963c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 49309566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 49319566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 493263c07aadSStefano Zampini #endif 49339566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 49349566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 49359566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 49369566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 493714e4dea2SJose E. 
Roman PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ)); 49389566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 49399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 4940674b392bSAlexander PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetHash_C", MatResetHash_SeqAIJ)); 49419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 49429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 49439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 49449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 49459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 49479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 49489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 49499566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 49509566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 49519566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 49523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 495317ab2063SBarry Smith } 495417ab2063SBarry Smith 4955b24902e0SBarry Smith /* 49563893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4957b24902e0SBarry Smith */ 4958d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4959d71ae5a4SJacob Faibussowitsch { 49602a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4961071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 496217ab2063SBarry Smith 49633a40ed3dSBarry Smith PetscFunctionBegin; 4964aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4965273d9f13SBarry Smith 4966d5f3da31SBarry Smith C->factortype = A->factortype; 4967f4259b30SLisandro Dalcin c->row = NULL; 4968f4259b30SLisandro Dalcin c->col = NULL; 4969f4259b30SLisandro Dalcin c->icol = NULL; 49706ad4291fSHong Zhang c->reallocs = 0; 4971bc43efbbSJunchao Zhang c->diagonaldense = a->diagonaldense; 497217ab2063SBarry Smith 497369272f91SPierre Jolivet C->assembled = A->assembled; 497417ab2063SBarry Smith 497569272f91SPierre Jolivet if (A->preallocated) { 49769566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 49779566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4978eec197d1SBarry Smith 497931fe6a7dSBarry Smith if (!A->hash_active) { 49809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 49819566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 49829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 49839566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, 
a->ilen, m * sizeof(PetscInt))); 498417ab2063SBarry Smith 498517ab2063SBarry Smith /* allocate the matrix space */ 4986f77e22a1SHong Zhang if (mallocmatspace) { 49879f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscScalar), (void **)&c->a)); 49889f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscInt), (void **)&c->j)); 49899f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(m + 1, sizeof(PetscInt), (void **)&c->i)); 49909566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 49919f0612e4SBarry Smith c->free_a = PETSC_TRUE; 49929f0612e4SBarry Smith c->free_ij = PETSC_TRUE; 499317ab2063SBarry Smith if (m > 0) { 49949566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4995be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 49962e5835c6SStefano Zampini const PetscScalar *aa; 49972e5835c6SStefano Zampini 49989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 49999566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 50009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 5001be6bf707SBarry Smith } else { 50029566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 500317ab2063SBarry Smith } 500408480c60SBarry Smith } 5005f77e22a1SHong Zhang } 500631fe6a7dSBarry Smith C->preallocated = PETSC_TRUE; 500731fe6a7dSBarry Smith } else { 500831fe6a7dSBarry Smith PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix"); 500931fe6a7dSBarry Smith PetscCall(MatSetUp(C)); 501031fe6a7dSBarry Smith } 501117ab2063SBarry Smith 50126ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 5013416022c9SBarry Smith c->roworiented = a->roworiented; 5014416022c9SBarry Smith c->nonew = a->nonew; 5015416022c9SBarry Smith if (a->diag) { 50169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 
50179566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 5018071fcb05SBarry Smith } else c->diag = NULL; 50192205254eSKarl Rupp 5020f4259b30SLisandro Dalcin c->solve_work = NULL; 5021f4259b30SLisandro Dalcin c->saved_values = NULL; 5022f4259b30SLisandro Dalcin c->idiag = NULL; 5023f4259b30SLisandro Dalcin c->ssor_work = NULL; 5024a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 50256ad4291fSHong Zhang 5026893ad86cSHong Zhang c->rmax = a->rmax; 5027416022c9SBarry Smith c->nz = a->nz; 50288ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 5029754ec7b1SSatish Balay 50306ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 50316ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 5032cd6b891eSBarry Smith if (a->compressedrow.use) { 50336ad4291fSHong Zhang i = a->compressedrow.nrows; 50349566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 50359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 50369566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 503727ea64f8SHong Zhang } else { 503827ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 50390298fd71SBarry Smith c->compressedrow.i = NULL; 50400298fd71SBarry Smith c->compressedrow.rindex = NULL; 50416ad4291fSHong Zhang } 5042ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 5043e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 50444846f1f5SKris Buschelman 50459566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 504669272f91SPierre Jolivet } 50479566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 50483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 504917ab2063SBarry Smith } 505017ab2063SBarry Smith 
5051d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 5052d71ae5a4SJacob Faibussowitsch { 5053b24902e0SBarry Smith PetscFunctionBegin; 50549566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 50559566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 505648a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 50579566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 50589566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 50593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5060b24902e0SBarry Smith } 5061b24902e0SBarry Smith 5062d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 5063d71ae5a4SJacob Faibussowitsch { 506452f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 506552f91c60SVaclav Hapla 506652f91c60SVaclav Hapla PetscFunctionBegin; 506752f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 506852f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 5069c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 50709566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 50719566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 50729566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 507352f91c60SVaclav Hapla if (isbinary) { 50749566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 507552f91c60SVaclav Hapla } else if (ishdf5) { 507652f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 50779566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 507852f91c60SVaclav 
Hapla #else 507952f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 508052f91c60SVaclav Hapla #endif 508152f91c60SVaclav Hapla } else { 508298921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 508352f91c60SVaclav Hapla } 50843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 508552f91c60SVaclav Hapla } 508652f91c60SVaclav Hapla 5087d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 5088d71ae5a4SJacob Faibussowitsch { 50893ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 50903ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 5091fbdbba38SShri Abhyankar 5092fbdbba38SShri Abhyankar PetscFunctionBegin; 50939566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5094bbead8a2SBarry Smith 50953ea6fe3dSLisandro Dalcin /* read in matrix header */ 50969566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 509708401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 50989371c9d4SSatish Balay M = header[1]; 50999371c9d4SSatish Balay N = header[2]; 51009371c9d4SSatish Balay nz = header[3]; 510108401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 510208401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 510308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format 
on disk, cannot load as SeqAIJ"); 5104fbdbba38SShri Abhyankar 51053ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 51069566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 51073ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 51083ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 51093ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 51103ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 51113ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 51129566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 51139566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 51143ea6fe3dSLisandro Dalcin 51153ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 51169566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5117aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51183ea6fe3dSLisandro Dalcin 5119fbdbba38SShri Abhyankar /* read in row lengths */ 51209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 51219566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 51223ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 51239371c9d4SSatish Balay sum = 0; 51249371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 512508401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 51263ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 51279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 51289566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5129aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51303ea6fe3dSLisandro Dalcin /* store row lengths */ 51319566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 51329566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5133fbdbba38SShri Abhyankar 51343ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 51359371c9d4SSatish Balay a->i[0] = 0; 51369371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 51373ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 51389566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 51393ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 51409566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5141fbdbba38SShri Abhyankar 51429566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 51439566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 51443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5145fbdbba38SShri Abhyankar } 5146fbdbba38SShri Abhyankar 5147d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5148d71ae5a4SJacob Faibussowitsch { 51497264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5150fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5151eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5152eeffb40dSHong Zhang PetscInt k; 5153eeffb40dSHong Zhang #endif 51547264ac53SSatish Balay 51553a40ed3dSBarry Smith PetscFunctionBegin; 5156bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5157d0f46423SBarry Smith if ((A->rmap->n != 
B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5158ca44d042SBarry Smith *flg = PETSC_FALSE; 51593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5160bcd2baecSBarry Smith } 51617264ac53SSatish Balay 51627264ac53SSatish Balay /* if the a->i are the same */ 51639566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 51643ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 51657264ac53SSatish Balay 51667264ac53SSatish Balay /* if a->j are the same */ 51679566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 51683ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 5169bcd2baecSBarry Smith 51709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 51719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5172bcd2baecSBarry Smith /* if a->a are the same */ 5173eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5174eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5175fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5176eeffb40dSHong Zhang *flg = PETSC_FALSE; 51773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5178eeffb40dSHong Zhang } 5179eeffb40dSHong Zhang } 5180eeffb40dSHong Zhang #else 51819566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5182eeffb40dSHong Zhang #endif 51839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 51849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 51853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51867264ac53SSatish Balay } 518736db0b34SBarry Smith 518805869f15SSatish Balay /*@ 518911a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 519036db0b34SBarry Smith provided by the user. 
519136db0b34SBarry Smith 5192d083f849SBarry Smith Collective 519336db0b34SBarry Smith 519436db0b34SBarry Smith Input Parameters: 519536db0b34SBarry Smith + comm - must be an MPI communicator of size 1 519636db0b34SBarry Smith . m - number of rows 519736db0b34SBarry Smith . n - number of columns 5198483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 519936db0b34SBarry Smith . j - column indices 520036db0b34SBarry Smith - a - matrix values 520136db0b34SBarry Smith 520236db0b34SBarry Smith Output Parameter: 520336db0b34SBarry Smith . mat - the matrix 520436db0b34SBarry Smith 520536db0b34SBarry Smith Level: intermediate 520636db0b34SBarry Smith 520736db0b34SBarry Smith Notes: 52082ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 5209292fb18eSBarry Smith once the matrix is destroyed and not before 521036db0b34SBarry Smith 521136db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 521236db0b34SBarry Smith 52132ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 521436db0b34SBarry Smith 5215a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5216a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 52178eef79e4SBarry Smith as shown 52182ef1f0ffSBarry Smith .vb 52192ef1f0ffSBarry Smith 1 0 0 52202ef1f0ffSBarry Smith 2 0 3 52212ef1f0ffSBarry Smith 4 5 6 5222a4552177SSatish Balay 52232ef1f0ffSBarry Smith i = {0,1,3,6} [size = nrow+1 = 3+1] 52242ef1f0ffSBarry Smith j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 52252ef1f0ffSBarry Smith v = {1,2,3,4,5,6} [size = 6] 52262ef1f0ffSBarry Smith .ve 5227a4552177SSatish Balay 52281cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 522936db0b34SBarry Smith @*/ 5230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5231d71ae5a4SJacob Faibussowitsch { 5232cbcfb4deSHong Zhang PetscInt ii; 523336db0b34SBarry Smith Mat_SeqAIJ *aij; 5234cbcfb4deSHong Zhang PetscInt jj; 523536db0b34SBarry Smith 523636db0b34SBarry Smith PetscFunctionBegin; 5237aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 52389566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52399566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52409566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 52419566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5243ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 52449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 52459566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5246ab93d7beSBarry Smith 524736db0b34SBarry Smith aij->i = i; 524836db0b34SBarry Smith aij->j = j; 524936db0b34SBarry Smith aij->a = a; 
525036db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5251e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5252e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 525336db0b34SBarry Smith 5254cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 525536db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 525676bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5257aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 52589985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 525908401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 526008401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 52619985e31cSBarry Smith } 526236db0b34SBarry Smith } 526376bd3646SJed Brown } 526476bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 526536db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 526608401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5267da0802e2SStefano Zampini PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1); 526836db0b34SBarry Smith } 526976bd3646SJed Brown } 527036db0b34SBarry Smith 52719566063dSJacob 
Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52729566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 527436db0b34SBarry Smith } 5275cbc6b225SStefano Zampini 5276f62e3866SBarry Smith /*@ 527711a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 52788a0b0e6bSVictor Minden provided by the user. 52798a0b0e6bSVictor Minden 5280d083f849SBarry Smith Collective 52818a0b0e6bSVictor Minden 52828a0b0e6bSVictor Minden Input Parameters: 52838a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 52848a0b0e6bSVictor Minden . m - number of rows 52858a0b0e6bSVictor Minden . n - number of columns 52868a0b0e6bSVictor Minden . i - row indices 52878a0b0e6bSVictor Minden . j - column indices 52881230e6d1SVictor Minden . a - matrix values 52891230e6d1SVictor Minden . nz - number of nonzeros 52902ef1f0ffSBarry Smith - idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 52918a0b0e6bSVictor Minden 52928a0b0e6bSVictor Minden Output Parameter: 52938a0b0e6bSVictor Minden . 
mat - the matrix 52948a0b0e6bSVictor Minden 52958a0b0e6bSVictor Minden Level: intermediate 52968a0b0e6bSVictor Minden 5297f62e3866SBarry Smith Example: 5298f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 52999e99939fSJunchao Zhang .vb 53008a0b0e6bSVictor Minden 1 0 0 53018a0b0e6bSVictor Minden 2 0 3 53028a0b0e6bSVictor Minden 4 5 6 53038a0b0e6bSVictor Minden 53048a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 53058a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 53068a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 53079e99939fSJunchao Zhang .ve 5308fe59aa6dSJacob Faibussowitsch 53092ef1f0ffSBarry Smith Note: 5310d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5311d7547e51SJunchao Zhang and are particularly useful in iterative applications. 53128a0b0e6bSVictor Minden 53131cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 53148a0b0e6bSVictor Minden @*/ 5315ce78bad3SBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscCount nz, PetscBool idx) 5316d71ae5a4SJacob Faibussowitsch { 5317d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 53188a0b0e6bSVictor Minden 53198a0b0e6bSVictor Minden PetscFunctionBegin; 53209566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5321ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 53229566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 53239566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 53249566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 53259566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 53261230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 53271230e6d1SVictor Minden if (idx) { 53281230e6d1SVictor Minden row = i[ii] - 1; 53291230e6d1SVictor Minden col = j[ii] - 1; 53301230e6d1SVictor Minden } else { 53311230e6d1SVictor Minden row = i[ii]; 53321230e6d1SVictor Minden col = j[ii]; 53338a0b0e6bSVictor Minden } 53349566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 53358a0b0e6bSVictor Minden } 53369566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 53379566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 53389566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 53393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53408a0b0e6bSVictor Minden } 534136db0b34SBarry Smith 5342d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5343d71ae5a4SJacob Faibussowitsch { 5344acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5345acf2f550SJed Brown 5346acf2f550SJed Brown PetscFunctionBegin; 5347acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5348acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 53492205254eSKarl Rupp 53509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 53513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5352acf2f550SJed Brown } 5353acf2f550SJed Brown 5354d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5355d71ae5a4SJacob Faibussowitsch { 53569c8f2541SHong Zhang PetscFunctionBegin; 53579566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 53583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53599c8f2541SHong Zhang } 53609c8f2541SHong Zhang 536181824310SBarry Smith /* 536253dd7562SDmitry Karpeev Permute A 
into C's *local* index space using rowemb,colemb. 536353dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 536453dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 536553dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 536653dd7562SDmitry Karpeev */ 5367d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5368d71ae5a4SJacob Faibussowitsch { 536953dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 537053dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 537153dd7562SDmitry Karpeev PetscBool seqaij; 537253dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 537353dd7562SDmitry Karpeev PetscScalar v; 537453dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 537553dd7562SDmitry Karpeev 537653dd7562SDmitry Karpeev PetscFunctionBegin; 53773ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 537853dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 53799566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 538028b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 538153dd7562SDmitry Karpeev if (rowemb) { 53829566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 538308401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 538453dd7562SDmitry Karpeev } else { 538508401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 538653dd7562SDmitry Karpeev } 538753dd7562SDmitry Karpeev if (colemb) { 53889566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 538908401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 539053dd7562SDmitry Karpeev } else { 539108401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 539253dd7562SDmitry Karpeev } 539353dd7562SDmitry Karpeev 5394f4f49eeaSPierre Jolivet Baij = (Mat_SeqAIJ *)B->data; 539553dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 53969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5397ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 53989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 53999566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 540053dd7562SDmitry Karpeev } 540148a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 540253dd7562SDmitry Karpeev count = 0; 540353dd7562SDmitry Karpeev rowindices = NULL; 
540453dd7562SDmitry Karpeev colindices = NULL; 540548a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 540648a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 540753dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 540853dd7562SDmitry Karpeev PetscInt row; 540953dd7562SDmitry Karpeev row = i; 541053dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 541153dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 541253dd7562SDmitry Karpeev PetscInt col; 541353dd7562SDmitry Karpeev col = Baij->j[count]; 541453dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 541553dd7562SDmitry Karpeev v = Baij->a[count]; 54169566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 541753dd7562SDmitry Karpeev ++count; 541853dd7562SDmitry Karpeev } 541953dd7562SDmitry Karpeev } 542053dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 542153dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 542253dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 542353dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 542453dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 54253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 542653dd7562SDmitry Karpeev } 542753dd7562SDmitry Karpeev 542858c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep) 5429dec0b466SHong Zhang { 5430dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5431dec0b466SHong Zhang MatScalar *aa = a->a; 5432dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5433dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5434dec0b466SHong Zhang 5435dec0b466SHong Zhang PetscFunctionBegin; 5436dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5437dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5438dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5439dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5440dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 544158c11ad4SPierre Jolivet if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++; 5442dec0b466SHong Zhang else { 5443dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5444dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5445dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5446dec0b466SHong Zhang } 5447dec0b466SHong Zhang } 5448dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5449dec0b466SHong Zhang fshift_prev = fshift; 5450dec0b466SHong Zhang /* reset ilen and imax for each row */ 5451dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5452dec0b466SHong Zhang a->nonzerorowcnt += 
((ai[i] - fshift - ai[i - 1]) > 0); 5453dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5454dec0b466SHong Zhang } 5455312eded4SPierre Jolivet if (fshift) { 5456dec0b466SHong Zhang if (m) { 5457dec0b466SHong Zhang ai[m] -= fshift; 5458dec0b466SHong Zhang a->nz = ai[m]; 5459dec0b466SHong Zhang } 5460dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5461312eded4SPierre Jolivet A->nonzerostate++; 5462dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5463dec0b466SHong Zhang a->rmax = rmax; 5464dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5465dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5466dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5467312eded4SPierre Jolivet } 54683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5469dec0b466SHong Zhang } 5470dec0b466SHong Zhang 54714099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 54724099cc6bSBarry Smith 5473cc4c1da9SBarry Smith /*@ 547411a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 54754099cc6bSBarry Smith 5476c3339decSBarry Smith Collective 54774099cc6bSBarry Smith 54784099cc6bSBarry Smith Input Parameters: 54794099cc6bSBarry Smith + mat - the matrix object 54804099cc6bSBarry Smith - matype - matrix type 54814099cc6bSBarry Smith 54824099cc6bSBarry Smith Options Database Key: 54834e187271SRichard Tran Mills . 
-mat_seqaij_type <method> - for example seqaijcrl 54844099cc6bSBarry Smith 54854099cc6bSBarry Smith Level: intermediate 54864099cc6bSBarry Smith 5487fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType` 54884099cc6bSBarry Smith @*/ 5489d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5490d71ae5a4SJacob Faibussowitsch { 54914099cc6bSBarry Smith PetscBool sametype; 54925f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 54934099cc6bSBarry Smith 54944099cc6bSBarry Smith PetscFunctionBegin; 54954099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 54969566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 54973ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 54984099cc6bSBarry Smith 54999566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 55006adde796SStefano Zampini PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 55019566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 55023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55034099cc6bSBarry Smith } 55044099cc6bSBarry Smith 55054099cc6bSBarry Smith /*@C 550611a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 55074099cc6bSBarry Smith 5508cc4c1da9SBarry Smith Not Collective, No Fortran Support 55094099cc6bSBarry Smith 55104099cc6bSBarry Smith Input Parameters: 5511fe59aa6dSJacob Faibussowitsch + sname - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 55124099cc6bSBarry Smith - function - routine to convert to subtype 55134099cc6bSBarry Smith 55142ef1f0ffSBarry Smith Level: advanced 55152ef1f0ffSBarry Smith 55164099cc6bSBarry Smith Notes: 551711a5261eSBarry Smith 
`MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 55184099cc6bSBarry Smith 55194099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 5520b44f4de4SBarry Smith .vb 5521b44f4de4SBarry Smith -mat_seqaij_type my_mat 5522b44f4de4SBarry Smith .ve 55234099cc6bSBarry Smith 55241cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()` 55254099cc6bSBarry Smith @*/ 5526d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5527d71ae5a4SJacob Faibussowitsch { 55284099cc6bSBarry Smith PetscFunctionBegin; 55299566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 55309566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 55313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55324099cc6bSBarry Smith } 55334099cc6bSBarry Smith 55344099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 55354099cc6bSBarry Smith 55364099cc6bSBarry Smith /*@C 553711a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 55384099cc6bSBarry Smith 55394099cc6bSBarry Smith Not Collective 55404099cc6bSBarry Smith 55414099cc6bSBarry Smith Level: advanced 55424099cc6bSBarry Smith 55432ef1f0ffSBarry Smith Note: 55442ef1f0ffSBarry Smith This registers the versions of `MATSEQAIJ` for GPUs 55452ef1f0ffSBarry Smith 55461cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()` 55474099cc6bSBarry Smith @*/ 5548d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5549d71ae5a4SJacob Faibussowitsch { 55504099cc6bSBarry Smith PetscFunctionBegin; 55513ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 55524099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 55534099cc6bSBarry Smith 
55549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 55559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 55569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 55579779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 55589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5559485f9817SRichard Tran Mills #endif 55605063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 55619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 55625063d097SStefano Zampini #endif 5563d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5564d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5565d5e393b6SSuyash Tandon #endif 55665063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 55679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 55685063d097SStefano Zampini #endif 55694099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 55709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 55714099cc6bSBarry Smith #endif 55723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55734099cc6bSBarry Smith } 557453dd7562SDmitry Karpeev 557553dd7562SDmitry Karpeev /* 557681824310SBarry Smith Special version for direct calls from Fortran 557781824310SBarry Smith */ 557881824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 557981824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 558081824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 558181824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 558281824310SBarry Smith #endif 558381824310SBarry Smith 
558481824310SBarry Smith /* Change these macros so can be used in void function */ 558598921bdaSJacob Faibussowitsch 558698921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 55879566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 55889566063dSJacob Faibussowitsch #undef PetscCall 55899371c9d4SSatish Balay #define PetscCall(...) \ 55909371c9d4SSatish Balay do { \ 55915f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 559298921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 559398921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 559498921bdaSJacob Faibussowitsch return; \ 559598921bdaSJacob Faibussowitsch } \ 559698921bdaSJacob Faibussowitsch } while (0) 559798921bdaSJacob Faibussowitsch 559898921bdaSJacob Faibussowitsch #undef SETERRQ 55999371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) 
\ 56009371c9d4SSatish Balay do { \ 560198921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 560298921bdaSJacob Faibussowitsch return; \ 560398921bdaSJacob Faibussowitsch } while (0) 560481824310SBarry Smith 5605d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5606d71ae5a4SJacob Faibussowitsch { 560781824310SBarry Smith Mat A = *AA; 560881824310SBarry Smith PetscInt m = *mm, n = *nn; 560981824310SBarry Smith InsertMode is = *isis; 561081824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 561181824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 561281824310SBarry Smith PetscInt *imax, *ai, *ailen; 561381824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 561454f21887SBarry Smith MatScalar *ap, value, *aa; 5615ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5616ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 561781824310SBarry Smith 561881824310SBarry Smith PetscFunctionBegin; 56194994cf47SJed Brown MatCheckPreallocated(A, 1); 562081824310SBarry Smith imax = a->imax; 562181824310SBarry Smith ai = a->i; 562281824310SBarry Smith ailen = a->ilen; 562381824310SBarry Smith aj = a->j; 562481824310SBarry Smith aa = a->a; 562581824310SBarry Smith 562681824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 562781824310SBarry Smith row = im[k]; 562881824310SBarry Smith if (row < 0) continue; 56295f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 56309371c9d4SSatish Balay rp = aj + ai[row]; 56319371c9d4SSatish Balay ap = aa + ai[row]; 56329371c9d4SSatish Balay rmax = imax[row]; 56339371c9d4SSatish Balay nrow = ailen[row]; 563481824310SBarry 
Smith low = 0; 563581824310SBarry Smith high = nrow; 563681824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 563781824310SBarry Smith if (in[l] < 0) continue; 56385f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 563981824310SBarry Smith col = in[l]; 56402205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 56412205254eSKarl Rupp else value = v[k + l * m]; 56422205254eSKarl Rupp 564381824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 564481824310SBarry Smith 56452205254eSKarl Rupp if (col <= lastcol) low = 0; 56462205254eSKarl Rupp else high = nrow; 564781824310SBarry Smith lastcol = col; 564881824310SBarry Smith while (high - low > 5) { 564981824310SBarry Smith t = (low + high) / 2; 565081824310SBarry Smith if (rp[t] > col) high = t; 565181824310SBarry Smith else low = t; 565281824310SBarry Smith } 565381824310SBarry Smith for (i = low; i < high; i++) { 565481824310SBarry Smith if (rp[i] > col) break; 565581824310SBarry Smith if (rp[i] == col) { 565681824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 565781824310SBarry Smith else ap[i] = value; 565881824310SBarry Smith goto noinsert; 565981824310SBarry Smith } 566081824310SBarry Smith } 566181824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 566281824310SBarry Smith if (nonew == 1) goto noinsert; 56635f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5664fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 56659371c9d4SSatish Balay N = nrow++ - 1; 56669371c9d4SSatish Balay a->nz++; 56679371c9d4SSatish Balay high++; 566881824310SBarry Smith /* shift up all the later entries in this row */ 566981824310SBarry Smith for (ii = N; ii >= i; ii--) { 
567081824310SBarry Smith rp[ii + 1] = rp[ii]; 567181824310SBarry Smith ap[ii + 1] = ap[ii]; 567281824310SBarry Smith } 567381824310SBarry Smith rp[i] = col; 567481824310SBarry Smith ap[i] = value; 567581824310SBarry Smith noinsert:; 567681824310SBarry Smith low = i + 1; 567781824310SBarry Smith } 567881824310SBarry Smith ailen[row] = nrow; 567981824310SBarry Smith } 568081824310SBarry Smith PetscFunctionReturnVoid(); 568181824310SBarry Smith } 568298921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 568398921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 568498921bdaSJacob Faibussowitsch * original definitions */ 56859566063dSJacob Faibussowitsch #undef PetscCall 568698921bdaSJacob Faibussowitsch #undef SETERRQ 5687