1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 20d71ae5a4SJacob Faibussowitsch { 214099cc6bSBarry Smith PetscBool flg; 224099cc6bSBarry Smith char type[256]; 234099cc6bSBarry Smith 244099cc6bSBarry Smith PetscFunctionBegin; 25d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 279566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 28d0609cedSBarry Smith PetscOptionsEnd(); 293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 304099cc6bSBarry Smith } 314099cc6bSBarry Smith 32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 33d71ae5a4SJacob Faibussowitsch { 340716a85fSBarry Smith PetscInt i, m, n; 350716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 360716a85fSBarry Smith 370716a85fSBarry Smith PetscFunctionBegin; 389566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 400716a85fSBarry Smith if (type == NORM_2) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 420716a85fSBarry Smith } else if (type == NORM_1) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_INFINITY) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 506adde796SStefano Zampini } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 53a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 54857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 560716a85fSBarry Smith } 573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 580716a85fSBarry Smith } 590716a85fSBarry Smith 60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 61d71ae5a4SJacob Faibussowitsch { 623a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 633a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 
643a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 653a062f41SBarry Smith PetscInt *rows; 663a062f41SBarry Smith 673a062f41SBarry Smith PetscFunctionBegin; 683a062f41SBarry Smith for (i = 0; i < m; i++) { 69ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i = 0; i < m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 799566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 84d71ae5a4SJacob Faibussowitsch { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 86fff043a9SJunchao Zhang const MatScalar *aa; 876ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith 916ce1633cSBarry Smith PetscFunctionBegin; 929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 939566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i = 0; i < m; i++) { 96ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 976ce1633cSBarry Smith } 989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 996ce1633cSBarry Smith cnt = 0; 1006ce1633cSBarry 
Smith for (i = 0; i < m; i++) { 101ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1026ce1633cSBarry Smith } 103f1f41ecbSJed Brown *nrows = cnt; 104f1f41ecbSJed Brown *zrows = rows; 1059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107f1f41ecbSJed Brown } 108f1f41ecbSJed Brown 109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 110d71ae5a4SJacob Faibussowitsch { 111f1f41ecbSJed Brown PetscInt nrows, *rows; 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscFunctionBegin; 1140298fd71SBarry Smith *zrows = NULL; 1159566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1169566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1186ce1633cSBarry Smith } 1196ce1633cSBarry Smith 120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 121d71ae5a4SJacob Faibussowitsch { 122b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 123b3a44c85SBarry Smith const MatScalar *aa; 124b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 125b3a44c85SBarry Smith const PetscInt *ii; 126b3a44c85SBarry Smith PetscInt n, i, j, *rows; 127b3a44c85SBarry Smith 128b3a44c85SBarry Smith PetscFunctionBegin; 1299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 130f4259b30SLisandro Dalcin *keptrows = NULL; 131b3a44c85SBarry Smith ii = a->i; 132b3a44c85SBarry Smith for (i = 0; i < m; i++) { 133b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 134b3a44c85SBarry Smith if (!n) { 135b3a44c85SBarry Smith cnt++; 136b3a44c85SBarry Smith goto ok1; 137b3a44c85SBarry Smith } 1382e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 
139b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 140b3a44c85SBarry Smith } 141b3a44c85SBarry Smith cnt++; 142b3a44c85SBarry Smith ok1:; 143b3a44c85SBarry Smith } 1442e5835c6SStefano Zampini if (!cnt) { 1459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1472e5835c6SStefano Zampini } 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 149b3a44c85SBarry Smith cnt = 0; 150b3a44c85SBarry Smith for (i = 0; i < m; i++) { 151b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 152b3a44c85SBarry Smith if (!n) continue; 1532e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 154b3a44c85SBarry Smith if (aa[j] != 0.0) { 155b3a44c85SBarry Smith rows[cnt++] = i; 156b3a44c85SBarry Smith break; 157b3a44c85SBarry Smith } 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 1609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1619566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith 165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 166d71ae5a4SJacob Faibussowitsch { 16779299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172ace3abfcSBarry Smith PetscBool missing; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 1769566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 17709f38230SBarry Smith if (!missing) { 17879299369SBarry Smith diag = aij->diag; 1799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 
1809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 18179299369SBarry Smith if (is == INSERT_VALUES) { 182ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18379299369SBarry Smith } else { 184ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18579299369SBarry Smith } 1869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18979299369SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 19109f38230SBarry Smith } 1929566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19409f38230SBarry Smith } 19579299369SBarry Smith 196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 197d71ae5a4SJacob Faibussowitsch { 198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19997f1f81fSBarry Smith PetscInt i, ishift; 20017ab2063SBarry Smith 2013a40ed3dSBarry Smith PetscFunctionBegin; 202f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2033ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 204bfeeae90SHong Zhang ishift = 0; 205b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2069566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 207bfeeae90SHong Zhang } else if (oshift == 1) { 2081a83f524SJed Brown PetscInt *tia; 209d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2103b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 
2121a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2131a83f524SJed Brown *ia = tia; 214ecc77c7aSBarry Smith if (ja) { 2151a83f524SJed Brown PetscInt *tja; 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob 
Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch 
PetscCall(PetscFree(*ja)); 2813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; 
row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 
379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, 
PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 4188e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 4198e3a54c0SPierre Jolivet if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]); 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != 
col) goto noinsert; 453c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e56f5c9eSBarry Smith A->nonzerostate++; 472e44c0bd4SBarry Smith noinsert:; 47317ab2063SBarry Smith } 47417ab2063SBarry Smith ailen[row] = nrow; 47517ab2063SBarry Smith } 4769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47817ab2063SBarry Smith } 47917ab2063SBarry Smith 480ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 481d71ae5a4SJacob Faibussowitsch { 48219b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48319b08ed1SBarry Smith PetscInt *rp, k, row; 48419b08ed1SBarry Smith PetscInt *ai = a->i; 48519b08ed1SBarry Smith 
PetscInt *aj = a->j; 486fff043a9SJunchao Zhang MatScalar *aa, *ap; 48719b08ed1SBarry Smith 48819b08ed1SBarry Smith PetscFunctionBegin; 48928b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 49008401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 491fff043a9SJunchao Zhang 4929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49319b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49419b08ed1SBarry Smith row = im[k]; 49519b08ed1SBarry Smith rp = aj + ai[row]; 4968e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 49719b08ed1SBarry Smith 4989566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49919b08ed1SBarry Smith if (!A->structure_only) { 50019b08ed1SBarry Smith if (v) { 5019566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 50219b08ed1SBarry Smith v += n; 50319b08ed1SBarry Smith } else { 5049566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith a->ilen[row] = n; 50819b08ed1SBarry Smith a->imax[row] = n; 50919b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 51019b08ed1SBarry Smith a->nz += n; 51119b08ed1SBarry Smith } 5129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51419b08ed1SBarry Smith } 51519b08ed1SBarry Smith 51619b08ed1SBarry Smith /*@ 51719b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 
51819b08ed1SBarry Smith 51919b08ed1SBarry Smith Input Parameters: 52011a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52119b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52219b08ed1SBarry Smith 52319b08ed1SBarry Smith Level: advanced 52419b08ed1SBarry Smith 52519b08ed1SBarry Smith Notes: 52619b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52711a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52819b08ed1SBarry Smith as always with multiple matrix assemblies. 52919b08ed1SBarry Smith 5301cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53119b08ed1SBarry Smith @*/ 532d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 533d71ae5a4SJacob Faibussowitsch { 53419b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53519b08ed1SBarry Smith 53619b08ed1SBarry Smith PetscFunctionBegin; 5379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5389566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53919b08ed1SBarry Smith a->maxnz = nztotal; 5404dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 54119b08ed1SBarry Smith if (!a->ilen) { 5429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54319b08ed1SBarry Smith } else { 5449566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54519b08ed1SBarry Smith } 54619b08ed1SBarry Smith 54719b08ed1SBarry Smith /* allocate the matrix space */ 54819b08ed1SBarry Smith if (A->structure_only) { 5499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 55119b08ed1SBarry Smith } 
else { 5529566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 55319b08ed1SBarry Smith } 55419b08ed1SBarry Smith a->i[0] = 0; 55519b08ed1SBarry Smith if (A->structure_only) { 55619b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55719b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55819b08ed1SBarry Smith } else { 55919b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 56019b08ed1SBarry Smith a->free_a = PETSC_TRUE; 56119b08ed1SBarry Smith } 56219b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 56319b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 56419b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56619b08ed1SBarry Smith } 56719b08ed1SBarry Smith 568ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 569d71ae5a4SJacob Faibussowitsch { 570071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 571071fcb05SBarry Smith PetscInt *rp, k, row; 572071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 573071fcb05SBarry Smith PetscInt *aj = a->j; 574fff043a9SJunchao Zhang MatScalar *aa, *ap; 575071fcb05SBarry Smith 576071fcb05SBarry Smith PetscFunctionBegin; 5779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 578071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 579071fcb05SBarry Smith row = im[k]; 5806bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 581071fcb05SBarry Smith rp = aj + ai[row]; 582071fcb05SBarry Smith ap = aa + ai[row]; 58348a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 584071fcb05SBarry Smith if (!A->structure_only) { 585071fcb05SBarry 
Smith if (v) { 5869566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 587071fcb05SBarry Smith v += n; 588071fcb05SBarry Smith } else { 5899566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 590071fcb05SBarry Smith } 591071fcb05SBarry Smith } 592071fcb05SBarry Smith ailen[row] = n; 593071fcb05SBarry Smith a->nz += n; 594071fcb05SBarry Smith } 5959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 597071fcb05SBarry Smith } 598071fcb05SBarry Smith 599ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 600d71ae5a4SJacob Faibussowitsch { 6017eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 60297f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 60397f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 6044e208921SJed Brown const MatScalar *ap, *aa; 6057eb43aa7SLois Curfman McInnes 6063a40ed3dSBarry Smith PetscFunctionBegin; 6074e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6087eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6097eb43aa7SLois Curfman McInnes row = im[k]; 6109371c9d4SSatish Balay if (row < 0) { 6119371c9d4SSatish Balay v += n; 6129371c9d4SSatish Balay continue; 6139371c9d4SSatish Balay } /* negative row */ 61454c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6158e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 6168e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 6177eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6187eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6199371c9d4SSatish Balay if (in[l] 
< 0) { 6209371c9d4SSatish Balay v++; 6219371c9d4SSatish Balay continue; 6229371c9d4SSatish Balay } /* negative column */ 62354c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 624bfeeae90SHong Zhang col = in[l]; 6259371c9d4SSatish Balay high = nrow; 6269371c9d4SSatish Balay low = 0; /* assume unsorted */ 6277eb43aa7SLois Curfman McInnes while (high - low > 5) { 6287eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6297eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6307eb43aa7SLois Curfman McInnes else low = t; 6317eb43aa7SLois Curfman McInnes } 6327eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6337eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6347eb43aa7SLois Curfman McInnes if (rp[i] == col) { 635b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6367eb43aa7SLois Curfman McInnes goto finished; 6377eb43aa7SLois Curfman McInnes } 6387eb43aa7SLois Curfman McInnes } 63997e567efSBarry Smith *v++ = 0.0; 6407eb43aa7SLois Curfman McInnes finished:; 6417eb43aa7SLois Curfman McInnes } 6427eb43aa7SLois Curfman McInnes } 6434e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6457eb43aa7SLois Curfman McInnes } 6467eb43aa7SLois Curfman McInnes 647ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 648d71ae5a4SJacob Faibussowitsch { 6493ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 650c898d852SStefano Zampini const PetscScalar *av; 6513ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6523ea6fe3dSLisandro Dalcin PetscInt *rowlens; 65317ab2063SBarry Smith 6543a40ed3dSBarry Smith PetscFunctionBegin; 6559566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6562205254eSKarl Rupp 6573ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6583ea6fe3dSLisandro Dalcin 
N = mat->cmap->N; 6593ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6603ea6fe3dSLisandro Dalcin nz = A->nz; 661416022c9SBarry Smith 6623ea6fe3dSLisandro Dalcin /* write matrix header */ 6633ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6649371c9d4SSatish Balay header[1] = M; 6659371c9d4SSatish Balay header[2] = N; 6669371c9d4SSatish Balay header[3] = nz; 6679566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 668416022c9SBarry Smith 6693ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6709566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6713ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6729566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6739566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6743ea6fe3dSLisandro Dalcin /* store column indices */ 6759566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 676416022c9SBarry Smith /* store nonzero values */ 6779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6789566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 680b37d52dbSMark F. 
Adams 6813ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6829566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 68417ab2063SBarry Smith } 685416022c9SBarry Smith 686d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 687d71ae5a4SJacob Faibussowitsch { 6887dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6897dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6907dc0baabSHong Zhang 6917dc0baabSHong Zhang PetscFunctionBegin; 6929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6937dc0baabSHong Zhang for (i = 0; i < m; i++) { 6949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 69548a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6977dc0baabSHong Zhang } 6989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7007dc0baabSHong Zhang } 7017dc0baabSHong Zhang 70209573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 703cd155464SBarry Smith 704ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 705d71ae5a4SJacob Faibussowitsch { 706416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 707c898d852SStefano Zampini const PetscScalar *av; 70860e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 709e060cb09SBarry Smith const char *name; 710f3ef73ceSBarry Smith PetscViewerFormat format; 71117ab2063SBarry Smith 7123a40ed3dSBarry Smith PetscFunctionBegin; 7137dc0baabSHong Zhang if (A->structure_only) { 7149566063dSJacob Faibussowitsch 
PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7167dc0baabSHong Zhang } 71743e49210SHong Zhang 7189566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7193ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 7202e5835c6SStefano Zampini 721c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 72471c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 72597f1f81fSBarry Smith PetscInt nofinalvalue = 0; 72660e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 727c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 728d00d2cf4SBarry Smith nofinalvalue = 1; 729d00d2cf4SBarry Smith } 7309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 733fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 735fbfe6fa7SJed Brown #else 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 737fbfe6fa7SJed Brown #endif 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73917ab2063SBarry Smith 74017ab2063SBarry Smith for (i = 0; i < m; i++) { 74160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 742aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7439566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 74417ab2063SBarry Smith #else 7459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 74617ab2063SBarry Smith #endif 74717ab2063SBarry Smith } 74817ab2063SBarry Smith } 749d00d2cf4SBarry Smith if (nofinalvalue) { 750c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 752c337ccceSJed Brown #else 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 754c337ccceSJed Brown #endif 755d00d2cf4SBarry Smith } 7569566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 759fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7609566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 76144cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 76360e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 764aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76536db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76736db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76936db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7716831982aSBarry Smith } 77244cd7ae7SLois Curfman McInnes #else 7739566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 77444cd7ae7SLois Curfman McInnes #endif 77544cd7ae7SLois Curfman McInnes } 7769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77744cd7ae7SLois 
Curfman McInnes } 7789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 779fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 78097f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7819566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 783496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 784496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 78560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 786496be53dSLois Curfman McInnes if (a->j[j] >= i) { 787aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78836db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 789496be53dSLois Curfman McInnes #else 790496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 791496be53dSLois Curfman McInnes #endif 792496be53dSLois Curfman McInnes } 793496be53dSLois Curfman McInnes } 794496be53dSLois Curfman McInnes } 7952e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7972e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7982205254eSKarl Rupp if (i + 4 < m) { 7999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 8002205254eSKarl Rupp } else if (i + 3 < m) { 8019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 8022205254eSKarl Rupp } else if (i + 2 < m) { 8039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 8042205254eSKarl Rupp } else if (i + 1 < m) { 8059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 8062205254eSKarl Rupp } else if (i < m) { 8079566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8082205254eSKarl Rupp } else { 8099566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8102205254eSKarl Rupp } 811496be53dSLois Curfman McInnes } 8129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8139566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 814496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8169566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 817496be53dSLois Curfman McInnes } 8189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 819496be53dSLois Curfman McInnes } 8209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 821496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 82260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 823496be53dSLois Curfman McInnes if (a->j[j] >= i) { 824aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 82548a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 826496be53dSLois Curfman McInnes #else 8279566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
828496be53dSLois Curfman McInnes #endif 829496be53dSLois Curfman McInnes } 830496be53dSLois Curfman McInnes } 8319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 832496be53dSLois Curfman McInnes } 8339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 834fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 83597f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 83687828ca2SBarry Smith PetscScalar value; 83768f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83868f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83968f1ed48SBarry Smith 84068f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 84168f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 84268f1ed48SBarry Smith realonly = PETSC_FALSE; 84368f1ed48SBarry Smith break; 84468f1ed48SBarry Smith } 84568f1ed48SBarry Smith } 84668f1ed48SBarry Smith #endif 84702594712SBarry Smith 8489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84902594712SBarry Smith for (i = 0; i < m; i++) { 85002594712SBarry Smith jcnt = 0; 851d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 852e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 85302594712SBarry Smith value = a->a[cnt++]; 854e24b481bSBarry Smith jcnt++; 85502594712SBarry Smith } else { 85602594712SBarry Smith value = 0.0; 85702594712SBarry Smith } 858aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85968f1ed48SBarry Smith if (realonly) { 8609566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 86168f1ed48SBarry Smith } else { 8629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 86368f1ed48SBarry Smith } 86402594712SBarry Smith #else 8659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 86602594712SBarry Smith 
#endif 86702594712SBarry Smith } 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86902594712SBarry Smith } 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8713c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 872150b93efSMatthew G. Knepley PetscInt fshift = 1; 8739566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8743c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8763c215bfdSMatthew Knepley #else 8779566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8783c215bfdSMatthew Knepley #endif 8799566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8803c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 88160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8823c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8839566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8843c215bfdSMatthew Knepley #else 8859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8863c215bfdSMatthew Knepley #endif 8873c215bfdSMatthew Knepley } 8883c215bfdSMatthew Knepley } 8899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8903a40ed3dSBarry Smith } else { 8919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 892d5f3da31SBarry Smith if (A->factortype) { 89316cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 89516cd7e1dSShri Abhyankar /* L part */ 89660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89716cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89816cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 90016cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 90216cd7e1dSShri Abhyankar } else { 9039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 90416cd7e1dSShri Abhyankar } 90516cd7e1dSShri Abhyankar #else 9069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90716cd7e1dSShri Abhyankar #endif 90816cd7e1dSShri Abhyankar } 90916cd7e1dSShri Abhyankar /* diagonal */ 91016cd7e1dSShri Abhyankar j = a->diag[i]; 91116cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91216cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 91416cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 91616cd7e1dSShri Abhyankar } else { 9179566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91816cd7e1dSShri Abhyankar } 91916cd7e1dSShri Abhyankar #else 9209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 92116cd7e1dSShri Abhyankar #endif 92216cd7e1dSShri Abhyankar 92316cd7e1dSShri Abhyankar /* U part */ 92460e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 92516cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 92616cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92816cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 93016cd7e1dSShri Abhyankar } else { 9319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 93216cd7e1dSShri Abhyankar } 93316cd7e1dSShri Abhyankar #else 9349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 93516cd7e1dSShri Abhyankar #endif 93616cd7e1dSShri Abhyankar } 9379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93816cd7e1dSShri Abhyankar } 93916cd7e1dSShri Abhyankar } else { 94017ab2063SBarry Smith for (i = 0; i < m; i++) { 9419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 94260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 943aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 94436db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94636db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9483a40ed3dSBarry Smith } else { 9499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 95017ab2063SBarry Smith } 95117ab2063SBarry Smith #else 9529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 95317ab2063SBarry Smith #endif 95417ab2063SBarry Smith } 9559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95617ab2063SBarry Smith } 95716cd7e1dSShri Abhyankar } 9589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95917ab2063SBarry Smith } 9609566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 962416022c9SBarry Smith } 963416022c9SBarry Smith 9649804daf3SBarry Smith #include <petscdraw.h> 965ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 966d71ae5a4SJacob Faibussowitsch { 967480ef9eaSBarry Smith Mat A = (Mat)Aa; 968416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 969383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 970383922c3SLisandro Dalcin int color; 971b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 972b0a32e0cSBarry Smith PetscViewer viewer; 973f3ef73ceSBarry Smith PetscViewerFormat format; 974fff043a9SJunchao Zhang const PetscScalar *aa; 975cddf8d76SBarry Smith 
9763a40ed3dSBarry Smith PetscFunctionBegin; 9779566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9789566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9799566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 980383922c3SLisandro Dalcin 981416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 983fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 984d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9850513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 986b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 987416022c9SBarry Smith for (i = 0; i < m; i++) { 9889371c9d4SSatish Balay y_l = m - i - 1.0; 9899371c9d4SSatish Balay y_r = y_l + 1.0; 990bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9919371c9d4SSatish Balay x_l = a->j[j]; 9929371c9d4SSatish Balay x_r = x_l + 1.0; 993fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9949566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 995cddf8d76SBarry Smith } 996cddf8d76SBarry Smith } 997b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 998cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9999371c9d4SSatish Balay y_l = m - i - 1.0; 10009371c9d4SSatish Balay y_r = y_l + 1.0; 1001bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10029371c9d4SSatish Balay x_l = a->j[j]; 10039371c9d4SSatish Balay x_r = x_l + 1.0; 1004fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 10059566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1006cddf8d76SBarry Smith } 1007cddf8d76SBarry Smith } 1008b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1009cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10109371c9d4SSatish Balay y_l = m - i - 1.0; 10119371c9d4SSatish Balay y_r = y_l + 1.0; 1012bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10139371c9d4SSatish Balay x_l = a->j[j]; 10149371c9d4SSatish Balay x_r = x_l + 1.0; 1015fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10169566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1017416022c9SBarry Smith } 1018416022c9SBarry Smith } 1019d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10200513a670SBarry Smith } else { 10210513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10220513a670SBarry Smith /* first determine max of all nonzero values */ 1023b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1024383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1025b0a32e0cSBarry Smith PetscDraw popup; 10260513a670SBarry Smith 10270513a670SBarry Smith for (i = 0; i < nz; i++) { 1028fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10290513a670SBarry Smith } 1030383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10319566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10329566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1033383922c3SLisandro Dalcin 1034d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10350513a670SBarry Smith for (i = 0; i < m; i++) { 1036383922c3SLisandro Dalcin y_l = m - i - 1.0; 1037383922c3SLisandro Dalcin y_r = y_l + 1.0; 1038bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1039383922c3SLisandro Dalcin x_l = a->j[j]; 1040383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1041fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10429566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10430513a670SBarry Smith count++; 10440513a670SBarry Smith } 10450513a670SBarry Smith } 1046d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10470513a670SBarry Smith } 10489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1050480ef9eaSBarry Smith } 1051cddf8d76SBarry Smith 10529804daf3SBarry Smith #include <petscdraw.h> 1053ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1054d71ae5a4SJacob Faibussowitsch { 1055b0a32e0cSBarry Smith PetscDraw draw; 105636db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1057ace3abfcSBarry Smith PetscBool isnull; 1058480ef9eaSBarry Smith 1059480ef9eaSBarry Smith PetscFunctionBegin; 10609566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10619566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10623ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1063480ef9eaSBarry Smith 10649371c9d4SSatish Balay xr = A->cmap->n; 10659371c9d4SSatish Balay yr = A->rmap->n; 10669371c9d4SSatish Balay h = yr / 10.0; 10679371c9d4SSatish Balay w = xr / 10.0; 10689371c9d4SSatish Balay xr += w; 10699371c9d4SSatish Balay yr += h; 10709371c9d4SSatish Balay xl = -w; 10719371c9d4SSatish Balay yl = -h; 10729566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10739566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10749566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10759566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10769566063dSJacob 
Faibussowitsch PetscCall(PetscDrawSave(draw)); 10773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1078416022c9SBarry Smith } 1079416022c9SBarry Smith 1080d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1081d71ae5a4SJacob Faibussowitsch { 1082ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1083416022c9SBarry Smith 10843a40ed3dSBarry Smith PetscFunctionBegin; 10859566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10869566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10881baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10891baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10901baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10919566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109317ab2063SBarry Smith } 109419bcc07fSBarry Smith 1095d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1096d71ae5a4SJacob Faibussowitsch { 1097416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1098580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1099bc43efbbSJunchao Zhang PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n; 110054f21887SBarry Smith MatScalar *aa = a->a, *ap; 11013447b6efSHong Zhang PetscReal ratio = 0.6; 110217ab2063SBarry Smith 11033a40ed3dSBarry Smith PetscFunctionBegin; 11043ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 11059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1106b215bc84SStefano Zampini if 
(A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1107b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11089566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1110b215bc84SStefano Zampini } 111117ab2063SBarry Smith 111243ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 111317ab2063SBarry Smith for (i = 1; i < m; i++) { 1114416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 111517ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111694a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111717ab2063SBarry Smith if (fshift) { 1118bfeeae90SHong Zhang ip = aj + ai[i]; 1119bfeeae90SHong Zhang ap = aa + ai[i]; 112017ab2063SBarry Smith N = ailen[i]; 11219566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 112248a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 112317ab2063SBarry Smith } 112417ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112517ab2063SBarry Smith } 112617ab2063SBarry Smith if (m) { 112717ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112817ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112917ab2063SBarry Smith } 113017ab2063SBarry Smith /* reset ilen and imax for each row */ 11317b083b7cSBarry Smith a->nonzerorowcnt = 0; 1132396832f4SHong Zhang if (A->structure_only) { 11339566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11349566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1135396832f4SHong Zhang } else { /* !A->structure_only */ 113617ab2063SBarry Smith for (i = 0; i < m; i++) { 113717ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11387b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113917ab2063SBarry Smith } 1140396832f4SHong Zhang } 
1141bfeeae90SHong Zhang a->nz = ai[m]; 1142aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 1143bc43efbbSJunchao Zhang PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly 1144bc43efbbSJunchao Zhang a->diagonaldense = PETSC_TRUE; 1145bc43efbbSJunchao Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1146bc43efbbSJunchao Zhang for (i = 0; i < n; i++) { 1147bc43efbbSJunchao Zhang if (a->diag[i] >= ai[i + 1]) { 1148bc43efbbSJunchao Zhang a->diagonaldense = PETSC_FALSE; 1149bc43efbbSJunchao Zhang break; 1150bc43efbbSJunchao Zhang } 1151bc43efbbSJunchao Zhang } 11529566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11539566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11549566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11552205254eSKarl Rupp 11568e58a170SBarry Smith A->info.mallocs += a->reallocs; 1157dd5f02e7SSatish Balay a->reallocs = 0; 11586712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 115936db0b34SBarry Smith a->rmax = rmax; 11604e220ebcSLois Curfman McInnes 116148a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11629566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 116417ab2063SBarry Smith } 116517ab2063SBarry Smith 1166ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1167d71ae5a4SJacob Faibussowitsch 
{ 116899cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116999cafbc1SBarry Smith PetscInt i, nz = a->nz; 11702e5835c6SStefano Zampini MatScalar *aa; 117199cafbc1SBarry Smith 117299cafbc1SBarry Smith PetscFunctionBegin; 11739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117499cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 117899cafbc1SBarry Smith } 117999cafbc1SBarry Smith 1180ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1181d71ae5a4SJacob Faibussowitsch { 118299cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 118399cafbc1SBarry Smith PetscInt i, nz = a->nz; 11842e5835c6SStefano Zampini MatScalar *aa; 118599cafbc1SBarry Smith 118699cafbc1SBarry Smith PetscFunctionBegin; 11879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 118899cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119299cafbc1SBarry Smith } 119399cafbc1SBarry Smith 1194d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1195d71ae5a4SJacob Faibussowitsch { 1196fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1197fff043a9SJunchao Zhang MatScalar *aa; 11983a40ed3dSBarry Smith 11993a40ed3dSBarry Smith PetscFunctionBegin; 12009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 12019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 12029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 12039566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 12043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120517ab2063SBarry Smith } 1206416022c9SBarry Smith 1207d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1208d71ae5a4SJacob Faibussowitsch { 1209416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1210d5d45c9bSBarry Smith 12113a40ed3dSBarry Smith PetscFunctionBegin; 1212b4e2f619SBarry Smith if (A->hash_active) { 1213e3c72094SPierre Jolivet A->ops[0] = a->cops; 1214b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 1215b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 1216b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 1217b4e2f619SBarry Smith } 1218b4e2f619SBarry Smith 12193ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 12209566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12219566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12229566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12289566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12299566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12309566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12319566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12329566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12339566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12349566063dSJacob Faibussowitsch 
PetscCall(PetscFree(A->data)); 1235901853e0SKris Buschelman 12366718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12376718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12386718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12396718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12406718818eSStefano Zampini due to different matrix sizes */ 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12426718818eSStefano Zampini 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12442e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12452e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12522e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12532e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12542e956fe4SStefano Zampini 
PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12552e956fe4SStefano Zampini #endif 12564222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12604222ddf1SHong Zhang #endif 1261d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1262d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1263d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1264d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1265d5e393b6SSuyash Tandon #endif 12663d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12683d0639e7SStefano Zampini #endif 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1270af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1272af8000cdSHong Zhang #endif 1273d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1275d24d4204SJose E. 
Roman #endif 127663c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 127963c07aadSStefano Zampini #endif 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12842e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12952e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12962e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12972e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12982e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12992e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 13002e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 13012e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 13023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 130317ab2063SBarry Smith } 130417ab2063SBarry Smith 1305d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1306d71ae5a4SJacob Faibussowitsch { 1307416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13083a40ed3dSBarry Smith 13093a40ed3dSBarry Smith PetscFunctionBegin; 1310a65d3064SKris Buschelman switch (op) { 1311d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1312d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1313d71ae5a4SJacob Faibussowitsch break; 1314d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1315d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1316d71ae5a4SJacob Faibussowitsch break; 1317d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 
1318d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1319d71ae5a4SJacob Faibussowitsch break; 1320d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1321d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1322d71ae5a4SJacob Faibussowitsch break; 1323d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1324d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1325d71ae5a4SJacob Faibussowitsch break; 1326d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1327d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1328d71ae5a4SJacob Faibussowitsch break; 1329d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1330d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1331d71ae5a4SJacob Faibussowitsch break; 13323d472b54SHong Zhang case MAT_SPD: 1333b1646e73SJed Brown case MAT_SYMMETRIC: 1334b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1335b1646e73SJed Brown case MAT_HERMITIAN: 1336b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1337957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1338b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1339b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1340b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13415021d80fSJed Brown break; 13428c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1343a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1344d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1345d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1346d71ae5a4SJacob Faibussowitsch break; 1347d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1348d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1349d71ae5a4SJacob Faibussowitsch break; 1350d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1351d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1352d71ae5a4SJacob Faibussowitsch break; 
1353071fcb05SBarry Smith case MAT_SORTED_FULL: 1354071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1355071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1356071fcb05SBarry Smith break; 1357d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1358d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1359d71ae5a4SJacob Faibussowitsch break; 1360d71ae5a4SJacob Faibussowitsch default: 1361d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1362a65d3064SKris Buschelman } 13633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 136417ab2063SBarry Smith } 136517ab2063SBarry Smith 1366ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1367d71ae5a4SJacob Faibussowitsch { 1368416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1369fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1370c898d852SStefano Zampini PetscScalar *x; 1371c898d852SStefano Zampini const PetscScalar *aa; 137217ab2063SBarry Smith 13733a40ed3dSBarry Smith PetscFunctionBegin; 13749566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 137508401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1377d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1378d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13799566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13802c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13819566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 138435e7444dSHong Zhang } 138535e7444dSHong Zhang 13869566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 138735e7444dSHong Zhang for (i = 0; i < n; i++) { 1388fdc842d1SBarry Smith x[i] = 0.0; 138935e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 139035e7444dSHong Zhang if (aj[j] == i) { 139135e7444dSHong Zhang x[i] = aa[j]; 139217ab2063SBarry Smith break; 139317ab2063SBarry Smith } 139417ab2063SBarry Smith } 139517ab2063SBarry Smith } 13969566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 139917ab2063SBarry Smith } 140017ab2063SBarry Smith 1401c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1403d71ae5a4SJacob Faibussowitsch { 1404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 14055f22a7b3SSebastian Grimberg const MatScalar *aa; 1406d9ca1df4SBarry Smith PetscScalar *y; 1407d9ca1df4SBarry Smith const PetscScalar *x; 1408d0f46423SBarry Smith PetscInt m = A->rmap->n; 14095c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14105f22a7b3SSebastian Grimberg const MatScalar *v; 1411a77337e4SBarry Smith PetscScalar alpha; 1412d9ca1df4SBarry Smith PetscInt n, i, j; 1413d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14143447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1415ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14165c897100SBarry Smith #endif 141717ab2063SBarry Smith 14183a40ed3dSBarry Smith PetscFunctionBegin; 14199566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14209566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14219566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14235c897100SBarry Smith 14245c897100SBarry Smith #if 
defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1425fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14265c897100SBarry Smith #else 14273447b6efSHong Zhang if (usecprow) { 14283447b6efSHong Zhang m = cprow.nrows; 14293447b6efSHong Zhang ii = cprow.i; 14307b2bb3b9SHong Zhang ridx = cprow.rindex; 14313447b6efSHong Zhang } else { 14323447b6efSHong Zhang ii = a->i; 14333447b6efSHong Zhang } 143417ab2063SBarry Smith for (i = 0; i < m; i++) { 14353447b6efSHong Zhang idx = a->j + ii[i]; 1436fff043a9SJunchao Zhang v = aa + ii[i]; 14373447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14383447b6efSHong Zhang if (usecprow) { 14397b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14403447b6efSHong Zhang } else { 144117ab2063SBarry Smith alpha = x[i]; 14423447b6efSHong Zhang } 144304fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 144417ab2063SBarry Smith } 14455c897100SBarry Smith #endif 14469566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14479566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14489566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 145117ab2063SBarry Smith } 145217ab2063SBarry Smith 1453d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1454d71ae5a4SJacob Faibussowitsch { 14555c897100SBarry Smith PetscFunctionBegin; 14569566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14579566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14595c897100SBarry Smith } 14605c897100SBarry Smith 1461c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 146278b84d54SShri Abhyankar 1463d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 
1464d71ae5a4SJacob Faibussowitsch { 1465416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1466d9fead3dSBarry Smith PetscScalar *y; 146754f21887SBarry Smith const PetscScalar *x; 1468fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1469003131ecSBarry Smith PetscInt m = A->rmap->n; 14700298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14717b083b7cSBarry Smith PetscInt n, i; 1472362ced78SSatish Balay PetscScalar sum; 1473ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 147417ab2063SBarry Smith 1475b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 147697952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1477fee21e36SBarry Smith #endif 1478fee21e36SBarry Smith 14793a40ed3dSBarry Smith PetscFunctionBegin; 1480b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14819566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1483b215bc84SStefano Zampini } 14849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14859566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14869566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1487416022c9SBarry Smith ii = a->i; 14884eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14899566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 149097952fefSHong Zhang m = a->compressedrow.nrows; 149197952fefSHong Zhang ii = a->compressedrow.i; 149297952fefSHong Zhang ridx = a->compressedrow.rindex; 149397952fefSHong Zhang for (i = 0; i < m; i++) { 149497952fefSHong Zhang n = ii[i + 1] - ii[i]; 149597952fefSHong Zhang aj = a->j + ii[i]; 1496fff043a9SJunchao Zhang aa = a_a + ii[i]; 149797952fefSHong Zhang sum = 0.0; 1498003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1499003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 150097952fefSHong Zhang y[*ridx++] = sum; 150197952fefSHong Zhang } 150297952fefSHong 
Zhang } else { /* do not use compressed row format */ 1503b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15043d3eaba7SBarry Smith aj = a->j; 1505fff043a9SJunchao Zhang aa = a_a; 1506b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1507b05257ddSBarry Smith #else 150817ab2063SBarry Smith for (i = 0; i < m; i++) { 1509003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1510003131ecSBarry Smith aj = a->j + ii[i]; 1511fff043a9SJunchao Zhang aa = a_a + ii[i]; 151217ab2063SBarry Smith sum = 0.0; 1513003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 151417ab2063SBarry Smith y[i] = sum; 151517ab2063SBarry Smith } 15168d195f9aSBarry Smith #endif 1517b05257ddSBarry Smith } 15189566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15209566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 152317ab2063SBarry Smith } 152417ab2063SBarry Smith 1525ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1526ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1527d71ae5a4SJacob Faibussowitsch { 1528b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1529b434eb95SMatthew G. Knepley PetscScalar *y; 1530b434eb95SMatthew G. Knepley const PetscScalar *x; 1531fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1532b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1533b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1534b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1535b434eb95SMatthew G. Knepley PetscScalar sum; 1536b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1537b434eb95SMatthew G. Knepley 1538b434eb95SMatthew G. 
Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1539b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1540b434eb95SMatthew G. Knepley #endif 1541b434eb95SMatthew G. Knepley 1542b434eb95SMatthew G. Knepley PetscFunctionBegin; 15439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15449566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15459566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1546b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1547b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1548b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1549b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1550b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1551b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1552b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1553fff043a9SJunchao Zhang aa = a_a + ii[i]; 1554b434eb95SMatthew G. Knepley sum = 0.0; 1555b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1556b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1557b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1558b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1559b434eb95SMatthew G. Knepley } 1560b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15613d3eaba7SBarry Smith ii = a->i; 1562b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1563b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1564b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1565fff043a9SJunchao Zhang aa = a_a + ii[i]; 1566b434eb95SMatthew G. Knepley sum = 0.0; 1567b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1568b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1569b434eb95SMatthew G. Knepley y[i] = sum; 1570b434eb95SMatthew G. Knepley } 1571b434eb95SMatthew G. 
Knepley } 15729566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15739566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15749566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1577b434eb95SMatthew G. Knepley } 1578b434eb95SMatthew G. Knepley 1579ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1580ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1581d71ae5a4SJacob Faibussowitsch { 1582b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1583b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1584b434eb95SMatthew G. Knepley const PetscScalar *x; 1585fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1586b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1587b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1588b434eb95SMatthew G. Knepley PetscScalar sum; 1589b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1590b434eb95SMatthew G. Knepley 1591b434eb95SMatthew G. Knepley PetscFunctionBegin; 15929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15939566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15949566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1595b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 159648a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1597b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1598b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1599b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1600b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1601b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1602b434eb95SMatthew G. 
Knepley aj = a->j + ii[i]; 1603fff043a9SJunchao Zhang aa = a_a + ii[i]; 1604b434eb95SMatthew G. Knepley sum = y[*ridx]; 1605b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1606b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1607b434eb95SMatthew G. Knepley } 1608b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16093d3eaba7SBarry Smith ii = a->i; 1610b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1611b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1612b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1613fff043a9SJunchao Zhang aa = a_a + ii[i]; 1614b434eb95SMatthew G. Knepley sum = y[i]; 1615b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1616b434eb95SMatthew G. Knepley z[i] = sum; 1617b434eb95SMatthew G. Knepley } 1618b434eb95SMatthew G. Knepley } 16199566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16209566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16219566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1624b434eb95SMatthew G. Knepley } 1625b434eb95SMatthew G. 
Knepley 1626c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1627d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1628d71ae5a4SJacob Faibussowitsch { 1629416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1630f15663dcSBarry Smith PetscScalar *y, *z; 1631f15663dcSBarry Smith const PetscScalar *x; 1632fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1633d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1634d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1635362ced78SSatish Balay PetscScalar sum; 1636ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16379ea0dfa2SSatish Balay 16383a40ed3dSBarry Smith PetscFunctionBegin; 1639b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16409566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1642b215bc84SStefano Zampini } 16439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16449566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16459566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16464eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 164748a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 164897952fefSHong Zhang m = a->compressedrow.nrows; 164997952fefSHong Zhang ii = a->compressedrow.i; 165097952fefSHong Zhang ridx = a->compressedrow.rindex; 165197952fefSHong Zhang for (i = 0; i < m; i++) { 165297952fefSHong Zhang n = ii[i + 1] - ii[i]; 165397952fefSHong Zhang aj = a->j + ii[i]; 1654fff043a9SJunchao Zhang aa = a_a + ii[i]; 165597952fefSHong Zhang sum = y[*ridx]; 1656f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165797952fefSHong Zhang z[*ridx++] = sum; 165897952fefSHong Zhang } 165997952fefSHong Zhang } else { /* do not use compressed row format */ 16603d3eaba7SBarry Smith ii = a->i; 
1661f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16623d3eaba7SBarry Smith aj = a->j; 1663fff043a9SJunchao Zhang aa = a_a; 1664f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1665f15663dcSBarry Smith #else 166617ab2063SBarry Smith for (i = 0; i < m; i++) { 1667f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1668f15663dcSBarry Smith aj = a->j + ii[i]; 1669fff043a9SJunchao Zhang aa = a_a + ii[i]; 167017ab2063SBarry Smith sum = y[i]; 1671f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 167217ab2063SBarry Smith z[i] = sum; 167317ab2063SBarry Smith } 167402ab625aSSatish Balay #endif 1675f15663dcSBarry Smith } 16769566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16779566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16789566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 168117ab2063SBarry Smith } 168217ab2063SBarry Smith 168317ab2063SBarry Smith /* 168417ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
168517ab2063SBarry Smith */ 1686d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1687d71ae5a4SJacob Faibussowitsch { 1688416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1689d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1690c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 169117ab2063SBarry Smith 16923a40ed3dSBarry Smith PetscFunctionBegin; 169309f38230SBarry Smith if (!a->diag) { 16949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1695c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 169609f38230SBarry Smith } 1697d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1698c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1699c0c07093SJunchao Zhang if (alreadySet) { 1700c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1701c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1702c0c07093SJunchao Zhang } 1703c0c07093SJunchao Zhang 170409f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1705bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1706bfeeae90SHong Zhang if (a->j[j] == i) { 170709f38230SBarry Smith a->diag[i] = j; 170817ab2063SBarry Smith break; 170917ab2063SBarry Smith } 171017ab2063SBarry Smith } 171117ab2063SBarry Smith } 17123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 171317ab2063SBarry Smith } 171417ab2063SBarry Smith 1715ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1716d71ae5a4SJacob Faibussowitsch { 171761ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 171861ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 171961ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 172061ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 172161ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 172261ecd0c6SBarry Smith 172361ecd0c6SBarry 
Smith PetscFunctionBegin; 172461ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17269566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 17273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 172861ecd0c6SBarry Smith } 172961ecd0c6SBarry Smith 173061ecd0c6SBarry Smith if (a->diagonaldense) { 173161ecd0c6SBarry Smith cnt = 0; 173261ecd0c6SBarry Smith } else { 17339566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 173461ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1735349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 173661ecd0c6SBarry Smith cnt++; 173761ecd0c6SBarry Smith mdiag[i] = 1; 173861ecd0c6SBarry Smith } 173961ecd0c6SBarry Smith } 174061ecd0c6SBarry Smith } 174161ecd0c6SBarry Smith if (!cnt) { 17429566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 174361ecd0c6SBarry Smith } else { 1744b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1745b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 174661ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 17476ea2a7edSJunchao Zhang const PetscScalar *Aa; 17486ea2a7edSJunchao Zhang 17496ea2a7edSJunchao Zhang PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host 17506ea2a7edSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa)); 175161ecd0c6SBarry Smith 175261ecd0c6SBarry Smith a->a = NULL; 175361ecd0c6SBarry Smith a->j = NULL; 175461ecd0c6SBarry Smith a->i = NULL; 175561ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1756ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17579566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 175861ecd0c6SBarry Smith 175961ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 176061ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17619566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 176248a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1763447d62f5SStefano Zampini } 17649566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17659566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 176661ecd0c6SBarry Smith if (singlemalloc) { 17679566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 176861ecd0c6SBarry Smith } else { 17699566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17709566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17719566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 177261ecd0c6SBarry Smith } 177361ecd0c6SBarry Smith } 17749566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 177561ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 17763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 177761ecd0c6SBarry Smith } 177861ecd0c6SBarry Smith 1779be5855fcSBarry Smith /* 1780be5855fcSBarry Smith Checks for missing diagonals 1781be5855fcSBarry Smith */ 1782d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1783d71ae5a4SJacob Faibussowitsch { 1784be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17857734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1786be5855fcSBarry Smith 1787be5855fcSBarry Smith PetscFunctionBegin; 178809f38230SBarry Smith *missing = PETSC_FALSE; 17897734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 179009f38230SBarry Smith *missing = PETSC_TRUE; 179109f38230SBarry Smith if (d) *d = 0; 17929566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 179309f38230SBarry Smith } else { 179401445905SHong Zhang PetscInt n; 179501445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1796f1e2ffcdSBarry Smith diag = a->diag; 179701445905SHong Zhang for (i = 0; i < n; i++) { 17987734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 179909f38230SBarry Smith *missing = PETSC_TRUE; 180009f38230SBarry Smith if (d) *d = i; 18019566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1802358d2f5dSShri Abhyankar break; 180309f38230SBarry Smith } 1804be5855fcSBarry Smith } 1805be5855fcSBarry Smith } 18063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1807be5855fcSBarry Smith } 1808be5855fcSBarry Smith 18090da83c2eSBarry Smith #include <petscblaslapack.h> 18100da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18110da83c2eSBarry Smith 18120da83c2eSBarry Smith /* 18130da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18140da83c2eSBarry Smith */ 1815ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1816d71ae5a4SJacob Faibussowitsch { 18170da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18180da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18190da83c2eSBarry Smith const PetscReal shift = 0.0; 18200da83c2eSBarry Smith PetscInt ipvt[5]; 18214e208921SJed Brown PetscCount flops = 0; 18220da83c2eSBarry Smith PetscScalar work[25], *v_work; 18230da83c2eSBarry Smith 18240da83c2eSBarry Smith PetscFunctionBegin; 18250da83c2eSBarry Smith allowzeropivot = 
PetscNot(A->erroriffailure); 18260da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 182708401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1828ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18299566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 183048a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18310da83c2eSBarry Smith ncnt = 0; 18320da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18330da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18349566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18350da83c2eSBarry Smith switch (bsizes[i]) { 1836d71ae5a4SJacob Faibussowitsch case 1: 1837d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1838d71ae5a4SJacob Faibussowitsch break; 18390da83c2eSBarry Smith case 2: 18409566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18410da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18429566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18430da83c2eSBarry Smith break; 18440da83c2eSBarry Smith case 3: 18459566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18460da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18480da83c2eSBarry Smith break; 18490da83c2eSBarry Smith case 4: 18509566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18510da83c2eSBarry Smith if (zeropivotdetected) 
A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18529566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18530da83c2eSBarry Smith break; 18540da83c2eSBarry Smith case 5: 18559566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18560da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18579566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18580da83c2eSBarry Smith break; 18590da83c2eSBarry Smith case 6: 18609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18610da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18630da83c2eSBarry Smith break; 18640da83c2eSBarry Smith case 7: 18659566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18660da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18679566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18680da83c2eSBarry Smith break; 18690da83c2eSBarry Smith default: 18709566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18710da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18729566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18730da83c2eSBarry Smith } 18740da83c2eSBarry Smith ncnt += bsizes[i]; 18750da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 18764e208921SJed Brown flops += 2 * PetscPowInt(bsizes[i], 3) / 3; 18770da83c2eSBarry Smith } 18783ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 187948a46eb9SPierre Jolivet if 
(bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18809566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18820da83c2eSBarry Smith } 18830da83c2eSBarry Smith 1884422a814eSBarry Smith /* 1885422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1886422a814eSBarry Smith */ 1887ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1888d71ae5a4SJacob Faibussowitsch { 188971f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1890d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18912e5835c6SStefano Zampini const MatScalar *v; 189254f21887SBarry Smith PetscScalar *idiag, *mdiag; 189371f1c65dSBarry Smith 189471f1c65dSBarry Smith PetscFunctionBegin; 18953ba16761SJacob Faibussowitsch if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS); 18969566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 189771f1c65dSBarry Smith diag = a->diag; 18984dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18992e5835c6SStefano Zampini 190071f1c65dSBarry Smith mdiag = a->mdiag; 190171f1c65dSBarry Smith idiag = a->idiag; 19029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1903422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 190471f1c65dSBarry Smith for (i = 0; i < m; i++) { 190571f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1906899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1907899639b0SHong Zhang if (PetscRealPart(fshift)) { 19089566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 19097b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19107b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19117b6c816cSBarry Smith 
A->factorerror_zeropivot_row = i; 191298921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1913899639b0SHong Zhang } 191471f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 191571f1c65dSBarry Smith } 19169566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 191771f1c65dSBarry Smith } else { 191871f1c65dSBarry Smith for (i = 0; i < m; i++) { 191971f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 192071f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 192171f1c65dSBarry Smith } 19229566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 192371f1c65dSBarry Smith } 192471f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 19263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 192771f1c65dSBarry Smith } 192871f1c65dSBarry Smith 1929d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1930d71ae5a4SJacob Faibussowitsch { 1931416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1932e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19332e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 193454f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19353d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 193697f1f81fSBarry Smith const PetscInt *idx, *diag; 193717ab2063SBarry Smith 19383a40ed3dSBarry Smith PetscFunctionBegin; 1939b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19409566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 19413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1942b215bc84SStefano Zampini } 1943b965ef7fSBarry Smith its = its * lits; 194491723122SBarry Smith 194571f1c65dSBarry Smith if (fshift != a->fshift || omega != 
a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19469566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 194771f1c65dSBarry Smith a->fshift = fshift; 194871f1c65dSBarry Smith a->omega = omega; 1949ed480e8bSBarry Smith 195071f1c65dSBarry Smith diag = a->diag; 195171f1c65dSBarry Smith t = a->ssor_work; 1952ed480e8bSBarry Smith idiag = a->idiag; 195371f1c65dSBarry Smith mdiag = a->mdiag; 1954ed480e8bSBarry Smith 19559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19569566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19579566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1958ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 195917ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 196017ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1961ed480e8bSBarry Smith bs = b; 196217ab2063SBarry Smith for (i = 0; i < m; i++) { 196371f1c65dSBarry Smith d = fshift + mdiag[i]; 1964416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1965ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19662e5835c6SStefano Zampini v = aa + diag[i] + 1; 196717ab2063SBarry Smith sum = b[i] * d / omega; 1968003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 196917ab2063SBarry Smith x[i] = sum; 197017ab2063SBarry Smith } 19719566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19729566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19749566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 197617ab2063SBarry Smith } 1977c783ea89SBarry Smith 197808401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1979f7d195e4SLawrence 
Mitchell if (flag & SOR_EISENSTAT) { 19804c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1981887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 198217ab2063SBarry Smith 198317ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 198417ab2063SBarry Smith 1985887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 198617ab2063SBarry Smith */ 198717ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 198817ab2063SBarry Smith 198917ab2063SBarry Smith /* x = (E + U)^{-1} b */ 199017ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1991416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1992ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19932e5835c6SStefano Zampini v = aa + diag[i] + 1; 199417ab2063SBarry Smith sum = b[i]; 1995e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1996ed480e8bSBarry Smith x[i] = sum * idiag[i]; 199717ab2063SBarry Smith } 199817ab2063SBarry Smith 199917ab2063SBarry Smith /* t = b - (2*E - D)x */ 20002e5835c6SStefano Zampini v = aa; 20012205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 200217ab2063SBarry Smith 200317ab2063SBarry Smith /* t = (E + L)^{-1}t */ 2004ed480e8bSBarry Smith ts = t; 2005416022c9SBarry Smith diag = a->diag; 200617ab2063SBarry Smith for (i = 0; i < m; i++) { 2007416022c9SBarry Smith n = diag[i] - a->i[i]; 2008ed480e8bSBarry Smith idx = a->j + a->i[i]; 20092e5835c6SStefano Zampini v = aa + a->i[i]; 201017ab2063SBarry Smith sum = t[i]; 2011003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 2012ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2013733d66baSBarry Smith /* x = x + t */ 2014733d66baSBarry Smith x[i] += t[i]; 201517ab2063SBarry Smith } 201617ab2063SBarry Smith 20179566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20189566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 
20203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 202117ab2063SBarry Smith } 202217ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 202317ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 202417ab2063SBarry Smith for (i = 0; i < m; i++) { 2025416022c9SBarry Smith n = diag[i] - a->i[i]; 2026ed480e8bSBarry Smith idx = a->j + a->i[i]; 20272e5835c6SStefano Zampini v = aa + a->i[i]; 202817ab2063SBarry Smith sum = b[i]; 2029e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20305c99c7daSBarry Smith t[i] = sum; 2031ed480e8bSBarry Smith x[i] = sum * idiag[i]; 203217ab2063SBarry Smith } 20335c99c7daSBarry Smith xb = t; 20349566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20353a40ed3dSBarry Smith } else xb = b; 203617ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 203717ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2038416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2039ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20402e5835c6SStefano Zampini v = aa + diag[i] + 1; 204117ab2063SBarry Smith sum = xb[i]; 2042e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20435c99c7daSBarry Smith if (xb == b) { 2044ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20455c99c7daSBarry Smith } else { 2046b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 204717ab2063SBarry Smith } 20485c99c7daSBarry Smith } 20499566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 205017ab2063SBarry Smith } 205117ab2063SBarry Smith its--; 205217ab2063SBarry Smith } 205317ab2063SBarry Smith while (its--) { 205417ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 205517ab2063SBarry Smith for (i = 0; i < m; i++) { 2056b19a5dc2SMark Adams /* lower */ 2057b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2058ed480e8bSBarry Smith idx = a->j + a->i[i]; 20592e5835c6SStefano 
Zampini v = aa + a->i[i]; 206017ab2063SBarry Smith sum = b[i]; 2061e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2062b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2063b19a5dc2SMark Adams /* upper */ 2064b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2065b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20662e5835c6SStefano Zampini v = aa + diag[i] + 1; 2067b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2068b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 206917ab2063SBarry Smith } 2070b19a5dc2SMark Adams xb = t; 20719566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2072b19a5dc2SMark Adams } else xb = b; 207317ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 207417ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2075b19a5dc2SMark Adams sum = xb[i]; 2076b19a5dc2SMark Adams if (xb == b) { 2077b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2078416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2079ed480e8bSBarry Smith idx = a->j + a->i[i]; 20802e5835c6SStefano Zampini v = aa + a->i[i]; 2081e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2082ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2083b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2084b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2085b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20862e5835c6SStefano Zampini v = aa + diag[i] + 1; 2087b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2088b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 208917ab2063SBarry Smith } 2090b19a5dc2SMark Adams } 2091b19a5dc2SMark Adams if (xb == b) { 20929566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2093b19a5dc2SMark Adams } else { 20949566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2095b19a5dc2SMark Adams } 209617ab2063SBarry Smith } 209717ab2063SBarry Smith } 20989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20999566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 21009566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 21013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 210217ab2063SBarry Smith } 210317ab2063SBarry Smith 2104ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2105d71ae5a4SJacob Faibussowitsch { 2106416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21074e220ebcSLois Curfman McInnes 21083a40ed3dSBarry Smith PetscFunctionBegin; 21094e220ebcSLois Curfman McInnes info->block_size = 1.0; 21103966268fSBarry Smith info->nz_allocated = a->maxnz; 21113966268fSBarry Smith info->nz_used = a->nz; 21123966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21133966268fSBarry Smith info->assemblies = A->num_ass; 21143966268fSBarry Smith info->mallocs = A->info.mallocs; 21154dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2116d5f3da31SBarry Smith if (A->factortype) { 21174e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21184e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21194e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21204e220ebcSLois Curfman McInnes } else { 21214e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21224e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21234e220ebcSLois Curfman McInnes info->factor_mallocs = 
0; 21244e220ebcSLois Curfman McInnes } 21253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 212617ab2063SBarry Smith } 212717ab2063SBarry Smith 2128ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2129d71ae5a4SJacob Faibussowitsch { 2130416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2131c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 213297b48c8fSBarry Smith const PetscScalar *xx; 21332e5835c6SStefano Zampini PetscScalar *bb, *aa; 2134c7da8527SEric Chamberland PetscInt d = 0; 213517ab2063SBarry Smith 21363a40ed3dSBarry Smith PetscFunctionBegin; 213797b48c8fSBarry Smith if (x && b) { 21389566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21399566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 214097b48c8fSBarry Smith for (i = 0; i < N; i++) { 2141aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2142447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 214397b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 214497b48c8fSBarry Smith } 21459566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21469566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 214797b48c8fSBarry Smith } 214897b48c8fSBarry Smith 21499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2150a9817697SBarry Smith if (a->keepnonzeropattern) { 2151f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2152aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21539566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2154f1e2ffcdSBarry Smith } 2155f4df32b1SMatthew Knepley if (diag != 0.0) { 2156c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2157c7da8527SEric 
Chamberland d = rows[i]; 2158447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 215908401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2160c7da8527SEric Chamberland } 2161f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2162447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21632e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2164f1e2ffcdSBarry Smith } 2165f1e2ffcdSBarry Smith } 2166f1e2ffcdSBarry Smith } else { 2167f4df32b1SMatthew Knepley if (diag != 0.0) { 216817ab2063SBarry Smith for (i = 0; i < N; i++) { 2169aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21707ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2171447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2172447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2173447d62f5SStefano Zampini } else { 2174416022c9SBarry Smith a->ilen[rows[i]] = 1; 21752e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2176bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2177447d62f5SStefano Zampini } 2178447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21799566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 218017ab2063SBarry Smith } 218117ab2063SBarry Smith } 21823a40ed3dSBarry Smith } else { 218317ab2063SBarry Smith for (i = 0; i < N; i++) { 2184aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2185416022c9SBarry Smith a->ilen[rows[i]] = 0; 218617ab2063SBarry Smith } 218717ab2063SBarry Smith } 2188e56f5c9eSBarry Smith A->nonzerostate++; 2189f1e2ffcdSBarry Smith } 21909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2191dbbe0bcdSBarry Smith 
PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 219317ab2063SBarry Smith } 219417ab2063SBarry Smith 2195ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2196d71ae5a4SJacob Faibussowitsch { 21976e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21986e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21992b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 22006e169961SBarry Smith const PetscScalar *xx; 22012e5835c6SStefano Zampini PetscScalar *bb, *aa; 22026e169961SBarry Smith 22036e169961SBarry Smith PetscFunctionBegin; 22043ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 22059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 22066e169961SBarry Smith if (x && b) { 22079566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 22089566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 22092b40b63fSBarry Smith vecs = PETSC_TRUE; 22106e169961SBarry Smith } 22119566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 22126e169961SBarry Smith for (i = 0; i < N; i++) { 2213aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 22148e3a54c0SPierre Jolivet PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]])); 22152205254eSKarl Rupp 22166e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22176e169961SBarry Smith } 22186e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22196e169961SBarry Smith if (!zeroed[i]) { 22206e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22214cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22222e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22232e5835c6SStefano Zampini 
aa[j] = 0.0; 22246e169961SBarry Smith } 22256e169961SBarry Smith } 22264cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i]; 22276e169961SBarry Smith } 22286e169961SBarry Smith if (x && b) { 22299566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22309566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22316e169961SBarry Smith } 22329566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22336e169961SBarry Smith if (diag != 0.0) { 22349566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22351d5a398dSstefano_zampini if (missing) { 22361d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22374cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2238aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22399566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22401d5a398dSstefano_zampini } 22411d5a398dSstefano_zampini } else { 2242ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22436e169961SBarry Smith } 22441d5a398dSstefano_zampini } 22459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2246dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22486e169961SBarry Smith } 22496e169961SBarry Smith 2250d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2251d71ae5a4SJacob Faibussowitsch { 2252fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2253fff043a9SJunchao Zhang const PetscScalar *aa; 225417ab2063SBarry Smith 22553a40ed3dSBarry Smith PetscFunctionBegin; 22569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
2257416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22588e3a54c0SPierre Jolivet if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]); 225917ab2063SBarry Smith if (idx) { 22605c0db29aSPierre Jolivet if (*nz && a->j) *idx = a->j + a->i[row]; 2261f4259b30SLisandro Dalcin else *idx = NULL; 226217ab2063SBarry Smith } 22639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 226517ab2063SBarry Smith } 226617ab2063SBarry Smith 2267d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2268d71ae5a4SJacob Faibussowitsch { 22693a40ed3dSBarry Smith PetscFunctionBegin; 22703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 227117ab2063SBarry Smith } 227217ab2063SBarry Smith 2273ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2274d71ae5a4SJacob Faibussowitsch { 2275416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22762e5835c6SStefano Zampini const MatScalar *v; 227736db0b34SBarry Smith PetscReal sum = 0.0; 227897f1f81fSBarry Smith PetscInt i, j; 227917ab2063SBarry Smith 22803a40ed3dSBarry Smith PetscFunctionBegin; 22819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 228217ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2283570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2284570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2285792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2286570b7f6dSBarry Smith #else 2287416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22889371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22899371c9d4SSatish Balay v++; 229017ab2063SBarry Smith } 22918f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2292570b7f6dSBarry Smith #endif 22939566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22943a40ed3dSBarry Smith } else if (type == NORM_1) { 229536db0b34SBarry Smith PetscReal *tmp; 229697f1f81fSBarry Smith PetscInt *jj = a->j; 22979566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2298064f8208SBarry Smith *nrm = 0.0; 2299416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 23009371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 23019371c9d4SSatish Balay v++; 230217ab2063SBarry Smith } 2303d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2304064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 230517ab2063SBarry Smith } 23069566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23079566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 23083a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2309064f8208SBarry Smith *nrm = 0.0; 2310d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 23118e3a54c0SPierre Jolivet const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]); 231217ab2063SBarry Smith sum = 0.0; 2313416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23149371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23159371c9d4SSatish Balay v2++; 231617ab2063SBarry Smith } 2317064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 231817ab2063SBarry Smith } 23199566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2320f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 232317ab2063SBarry Smith } 232417ab2063SBarry Smith 2325ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2326d71ae5a4SJacob Faibussowitsch { 23273d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 232854f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 
23292e5835c6SStefano Zampini const MatScalar *va, *vb; 233097f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2331cd0d46ebSvictorle 2332cd0d46ebSvictorle PetscFunctionBegin; 23339566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23349566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23355485867bSBarry Smith if (ma != nb || na != mb) { 23365485867bSBarry Smith *f = PETSC_FALSE; 23373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23385485867bSBarry Smith } 23399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23419371c9d4SSatish Balay aii = aij->i; 23429371c9d4SSatish Balay bii = bij->i; 23439371c9d4SSatish Balay adx = aij->j; 23449371c9d4SSatish Balay bdx = bij->j; 23459566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23469566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2347cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2348cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2349cd0d46ebSvictorle 2350cd0d46ebSvictorle *f = PETSC_TRUE; 2351cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2352cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 235397f1f81fSBarry Smith PetscInt idc, idr; 23545485867bSBarry Smith PetscScalar vc, vr; 2355cd0d46ebSvictorle /* column/row index/value */ 23565485867bSBarry Smith idc = adx[aptr[i]]; 23575485867bSBarry Smith idr = bdx[bptr[idc]]; 23585485867bSBarry Smith vc = va[aptr[i]]; 23595485867bSBarry Smith vr = vb[bptr[idc]]; 23605485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23615485867bSBarry Smith *f = PETSC_FALSE; 23625485867bSBarry Smith goto done; 2363cd0d46ebSvictorle } else { 23645485867bSBarry Smith aptr[i]++; 23655485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2366cd0d46ebSvictorle } 2367cd0d46ebSvictorle } 2368cd0d46ebSvictorle } 2369cd0d46ebSvictorle done: 23709566063dSJacob Faibussowitsch 
PetscCall(PetscFree(aptr)); 23719566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 23743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2375cd0d46ebSvictorle } 2376cd0d46ebSvictorle 2377ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2378d71ae5a4SJacob Faibussowitsch { 23793d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 238054f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 238154f21887SBarry Smith MatScalar *va, *vb; 23821cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23831cbb95d3SBarry Smith 23841cbb95d3SBarry Smith PetscFunctionBegin; 23859566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23869566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23871cbb95d3SBarry Smith if (ma != nb || na != mb) { 23881cbb95d3SBarry Smith *f = PETSC_FALSE; 23893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23901cbb95d3SBarry Smith } 23919371c9d4SSatish Balay aii = aij->i; 23929371c9d4SSatish Balay bii = bij->i; 23939371c9d4SSatish Balay adx = aij->j; 23949371c9d4SSatish Balay bdx = bij->j; 23959371c9d4SSatish Balay va = aij->a; 23969371c9d4SSatish Balay vb = bij->a; 23979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23991cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 24001cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 24011cbb95d3SBarry Smith 24021cbb95d3SBarry Smith *f = PETSC_TRUE; 24031cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 24041cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 24051cbb95d3SBarry Smith PetscInt idc, idr; 24061cbb95d3SBarry Smith PetscScalar vc, vr; 24071cbb95d3SBarry 
Smith /* column/row index/value */ 24081cbb95d3SBarry Smith idc = adx[aptr[i]]; 24091cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24101cbb95d3SBarry Smith vc = va[aptr[i]]; 24111cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24121cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24131cbb95d3SBarry Smith *f = PETSC_FALSE; 24141cbb95d3SBarry Smith goto done; 24151cbb95d3SBarry Smith } else { 24161cbb95d3SBarry Smith aptr[i]++; 24171cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24181cbb95d3SBarry Smith } 24191cbb95d3SBarry Smith } 24201cbb95d3SBarry Smith } 24211cbb95d3SBarry Smith done: 24229566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24239566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24251cbb95d3SBarry Smith } 24261cbb95d3SBarry Smith 2427ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2428d71ae5a4SJacob Faibussowitsch { 24299e29f15eSvictorle PetscFunctionBegin; 24309566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f)); 24313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24329e29f15eSvictorle } 24339e29f15eSvictorle 2434ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2435d71ae5a4SJacob Faibussowitsch { 24361cbb95d3SBarry Smith PetscFunctionBegin; 24379566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f)); 24383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24391cbb95d3SBarry Smith } 24401cbb95d3SBarry Smith 2441d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2442d71ae5a4SJacob Faibussowitsch { 2443416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2444fff8e43fSBarry Smith const PetscScalar *l, *r; 2445fff8e43fSBarry Smith PetscScalar x; 244654f21887SBarry Smith MatScalar *v; 
2447fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2448fff8e43fSBarry Smith const PetscInt *jj; 244917ab2063SBarry Smith 24503a40ed3dSBarry Smith PetscFunctionBegin; 245117ab2063SBarry Smith if (ll) { 24523ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24533ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24549566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 245508401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24569566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 245817ab2063SBarry Smith for (i = 0; i < m; i++) { 245917ab2063SBarry Smith x = l[i]; 2460416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24612205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 246217ab2063SBarry Smith } 24639566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24649566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 246617ab2063SBarry Smith } 246717ab2063SBarry Smith if (rr) { 24689566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 246908401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24709566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24722e5835c6SStefano Zampini jj = a->j; 24732205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24759566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24769566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 247717ab2063SBarry Smith } 24789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 
24793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 248017ab2063SBarry Smith } 248117ab2063SBarry Smith 2482d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2483d71ae5a4SJacob Faibussowitsch { 2484db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2485d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 248697f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24875d0c19d7SBarry Smith const PetscInt *irow, *icol; 24882e5835c6SStefano Zampini const PetscScalar *aa; 24895d0c19d7SBarry Smith PetscInt nrows, ncols; 249097f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 2491fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2492416022c9SBarry Smith Mat C; 2493cdc6f3adSToby Isaac PetscBool stride; 249417ab2063SBarry Smith 24953a40ed3dSBarry Smith PetscFunctionBegin; 24969566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24979566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24989566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 249917ab2063SBarry Smith 25009566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2501ff718158SBarry Smith if (stride) { 25029566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2503ff718158SBarry Smith } else { 2504ff718158SBarry Smith first = 0; 2505ff718158SBarry Smith step = 0; 2506ff718158SBarry Smith } 2507fee21e36SBarry Smith if (stride && step == 1) { 250802834360SBarry Smith /* special case of contiguous rows */ 25099566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 251002834360SBarry Smith /* loop over new rows determining lens and starting points */ 251102834360SBarry Smith for (i = 0; i < nrows; i++) { 
2512bfeeae90SHong Zhang kstart = ai[irow[i]]; 2513a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2514a91a9bebSLisandro Dalcin starts[i] = kstart; 251502834360SBarry Smith for (k = kstart; k < kend; k++) { 2516bfeeae90SHong Zhang if (aj[k] >= first) { 251702834360SBarry Smith starts[i] = k; 251802834360SBarry Smith break; 251902834360SBarry Smith } 252002834360SBarry Smith } 2521a2744918SBarry Smith sum = 0; 252202834360SBarry Smith while (k < kend) { 2523bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2524a2744918SBarry Smith sum++; 252502834360SBarry Smith } 2526a2744918SBarry Smith lens[i] = sum; 252702834360SBarry Smith } 252802834360SBarry Smith /* create submatrix */ 2529cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 253097f1f81fSBarry Smith PetscInt n_cols, n_rows; 25319566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2532aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25339566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 253408480c60SBarry Smith C = *B; 25353a40ed3dSBarry Smith } else { 25363bef6203SJed Brown PetscInt rbs, cbs; 25379566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25389566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25399566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25409566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25419566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25429566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 254408480c60SBarry Smith } 2545db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2546db02288aSLois Curfman McInnes 254702834360SBarry Smith /* loop over rows inserting into submatrix */ 
2548fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2549db02288aSLois Curfman McInnes j_new = c->j; 2550db02288aSLois Curfman McInnes i_new = c->i; 25519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 255202834360SBarry Smith for (i = 0; i < nrows; i++) { 2553a2744918SBarry Smith ii = starts[i]; 2554a2744918SBarry Smith lensi = lens[i]; 2555810441c8SPierre Jolivet if (lensi) { 2556ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25579566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2558a2744918SBarry Smith a_new += lensi; 2559810441c8SPierre Jolivet } 2560a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2561a2744918SBarry Smith c->ilen[i] = lensi; 256202834360SBarry Smith } 2563fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25659566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25663a40ed3dSBarry Smith } else { 25679566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25689566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25699566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25704dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25716bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25724dcab191SBarry Smith smap[icol[i]] = i + 1; 25734dcab191SBarry Smith } 25744dcab191SBarry Smith 257502834360SBarry Smith /* determine lens of each row */ 257602834360SBarry Smith for (i = 0; i < nrows; i++) { 2577bfeeae90SHong Zhang kstart = ai[irow[i]]; 257802834360SBarry Smith kend = kstart + 
a->ilen[irow[i]]; 257902834360SBarry Smith lens[i] = 0; 258002834360SBarry Smith for (k = kstart; k < kend; k++) { 2581ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 258202834360SBarry Smith } 258302834360SBarry Smith } 258417ab2063SBarry Smith /* Create and fill new matrix */ 2585a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2586ace3abfcSBarry Smith PetscBool equal; 25870f5bd95cSBarry Smith 258899141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2589aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25909566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 2591fdfbdca6SPierre Jolivet PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong number of nonzeros"); 25929566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 259308480c60SBarry Smith C = *B; 25943a40ed3dSBarry Smith } else { 25953bef6203SJed Brown PetscInt rbs, cbs; 25969566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25979566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25989566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25999566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 260037a5e0faSPierre Jolivet if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs)); 26019566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 26029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 260308480c60SBarry Smith } 26049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2605fb3c7e2dSJunchao Zhang 260699141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 2607fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 
260817ab2063SBarry Smith for (i = 0; i < nrows; i++) { 260999141d43SSatish Balay row = irow[i]; 2610bfeeae90SHong Zhang kstart = ai[row]; 261199141d43SSatish Balay kend = kstart + a->ilen[row]; 2612bfeeae90SHong Zhang mat_i = c->i[i]; 26138e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 26148e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 261599141d43SSatish Balay mat_ilen = c->ilen + i; 261617ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2617bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2618ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26192e5835c6SStefano Zampini *mat_a++ = aa[k]; 262099141d43SSatish Balay (*mat_ilen)++; 262117ab2063SBarry Smith } 262217ab2063SBarry Smith } 262317ab2063SBarry Smith } 26249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 262502834360SBarry Smith /* Free work space */ 26269566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26279566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26289566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2629cdc6f3adSToby Isaac /* sort */ 2630cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2631cdc6f3adSToby Isaac PetscInt ilen; 2632cdc6f3adSToby Isaac 2633cdc6f3adSToby Isaac mat_i = c->i[i]; 26348e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 26358e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 2636cdc6f3adSToby Isaac ilen = c->ilen[i]; 26379566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2638cdc6f3adSToby Isaac } 2639fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 264002834360SBarry Smith } 26418c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26429566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2643305c6ccfSStefano Zampini #endif 26449566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26459566063dSJacob Faibussowitsch 
PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 264617ab2063SBarry Smith 26479566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2648416022c9SBarry Smith *B = C; 26493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 265017ab2063SBarry Smith } 265117ab2063SBarry Smith 2652ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2653d71ae5a4SJacob Faibussowitsch { 265482d44351SHong Zhang Mat B; 265582d44351SHong Zhang 265682d44351SHong Zhang PetscFunctionBegin; 2657c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26589566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26599566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26609566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26619566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26629566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 266382d44351SHong Zhang *subMat = B; 2664c2d650bdSHong Zhang } else { 26659566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2666c2d650bdSHong Zhang } 26673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 266882d44351SHong Zhang } 266982d44351SHong Zhang 2670ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2671d71ae5a4SJacob Faibussowitsch { 267263b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 267363b91edcSBarry Smith Mat outA; 2674ace3abfcSBarry Smith PetscBool row_identity, col_identity; 267563b91edcSBarry Smith 26763a40ed3dSBarry Smith PetscFunctionBegin; 267708401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26781df811f5SHong Zhang 26799566063dSJacob Faibussowitsch 
PetscCall(ISIdentity(row, &row_identity)); 26809566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2681a871dcd8SBarry Smith 268263b91edcSBarry Smith outA = inA; 2683d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26849566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26859566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26862205254eSKarl Rupp 26879566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26889566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26892205254eSKarl Rupp 2690c3122656SLisandro Dalcin a->row = row; 26912205254eSKarl Rupp 26929566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26939566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26942205254eSKarl Rupp 2695c3122656SLisandro Dalcin a->col = col; 269663b91edcSBarry Smith 269736db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26989566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26999566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2700f0ec6fceSSatish Balay 270194a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 27029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 270394a9d846SBarry Smith } 270463b91edcSBarry Smith 27059566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2706137fb511SHong Zhang if (row_identity && col_identity) { 27079566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2708137fb511SHong Zhang } else { 27099566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2710137fb511SHong Zhang } 27113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2712a871dcd8SBarry Smith } 2713a871dcd8SBarry Smith 2714d71ae5a4SJacob Faibussowitsch 
PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2715d71ae5a4SJacob Faibussowitsch { 2716f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2717dfa0f9e5SStefano Zampini PetscScalar *v; 2718c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 27193a40ed3dSBarry Smith 27203a40ed3dSBarry Smith PetscFunctionBegin; 27219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27229566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2723792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27249566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2728f0b747eeSBarry Smith } 2729f0b747eeSBarry Smith 2730d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2731d71ae5a4SJacob Faibussowitsch { 273216b64355SHong Zhang PetscInt i; 273316b64355SHong Zhang 273416b64355SHong Zhang PetscFunctionBegin; 273516b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27369566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 273716b64355SHong Zhang 273848a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27399566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 274016b64355SHong Zhang 274116b64355SHong Zhang if (submatj->rbuf1) { 27429566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27439566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 274416b64355SHong Zhang } 274516b64355SHong Zhang 274648a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27479566063dSJacob 
Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27489566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 274916b64355SHong Zhang } 275016b64355SHong Zhang 275116b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2752eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27539566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27549566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 275516b64355SHong Zhang #else 27569566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 275716b64355SHong Zhang #endif 275816b64355SHong Zhang 275916b64355SHong Zhang if (!submatj->allcolumns) { 276016b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2761eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap)); 276216b64355SHong Zhang #else 27639566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 276416b64355SHong Zhang #endif 276516b64355SHong Zhang } 27669566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 276716b64355SHong Zhang 27689566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 27693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 277016b64355SHong Zhang } 277116b64355SHong Zhang 2772d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2773d71ae5a4SJacob Faibussowitsch { 277416b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27755c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 277616b64355SHong Zhang 277716b64355SHong Zhang PetscFunctionBegin; 27789566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27799566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 278116b64355SHong Zhang } 278216b64355SHong Zhang 278389a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 
/*
   MatDestroySubMatrices_SeqAIJ - Destroys an array of n submatrices and frees the array.

   Input Parameters:
+  n   - number of matrices in the array
-  mat - address of the array; *mat is freed on return

   Entries that carry submatrix support data (c->submatis1 != NULL) have their reference
   count decremented by hand and, once it drops to zero, are taken apart piece by piece.
   All other entries are handed to MatDestroy().
*/
static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[])
{
  PetscInt     i;
  Mat          C;
  Mat_SeqAIJ  *c;
  Mat_SubSppt *submatj;

  PetscFunctionBegin;
  for (i = 0; i < n; i++) {
    C       = (*mat)[i];
    c       = (Mat_SeqAIJ *)C->data;
    submatj = c->submatis1; /* read before C is destroyed below */
    if (submatj) {
      if (--((PetscObject)C)->refct <= 0) {
        PetscCall(PetscFree(C->factorprefix));
        PetscCall((*submatj->destroy)(C));
        PetscCall(MatDestroySubMatrix_Private(submatj));
        PetscCall(PetscFree(C->defaultvectype));
        PetscCall(PetscFree(C->defaultrandtype));
        PetscCall(PetscLayoutDestroy(&C->rmap));
        PetscCall(PetscLayoutDestroy(&C->cmap));
        PetscCall(PetscHeaderDestroy(&C));
      }
    } else {
      PetscCall(MatDestroy(&C));
    }
  }

  /* Destroy Dummy submatrices created for reuse */
  PetscCall(MatDestroySubMatrices_Dummy(n, mat));

  PetscCall(PetscFree(*mat));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
   MatCreateSubMatrices_SeqAIJ - Extracts n submatrices of A, one per (irow[i], icol[i]) pair.

   Input Parameters:
+  A     - the matrix
.  n     - number of submatrices
.  irow  - row index sets, one per submatrix
.  icol  - column index sets, one per submatrix
-  scall - MAT_INITIAL_MATRIX makes this routine allocate *B; any other value uses the *B passed in

   Output Parameter:
.  B - the array of submatrices

   Each submatrix is produced by MatCreateSubMatrix_SeqAIJ().
*/
static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[])
{
  PetscInt i;

  PetscFunctionBegin;
  /* zero-initialized array with n + 1 slots */
  if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B));

  for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i]));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
   MatIncreaseOverlap_SeqAIJ - Grows each index set by ov levels of overlap.

   Input Parameters:
+  A      - the matrix
.  is_max - number of index sets
.  is     - the index sets; each is destroyed and replaced by the enlarged set
-  ov     - number of overlap levels, must be >= 0

   One level adds, for every index appended during the previous level, the column indices
   stored in that row of A. When the row and column block sizes are equal and larger than 1
   the same procedure is carried out on block indices and the result is created with
   ISCreateBlock(); otherwise point indices are used and the result is created with
   ISCreateGeneral().

   NOTE(review): column indices are fed back in as row indices and the bit table has one
   bit per (block) row, so this presumably expects a square nonzero structure - confirm.
*/
static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov)
{
  Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
  PetscInt        row, i, j, k, l, ll, m, n, *nidx, isz, val;
  const PetscInt *idx;
  PetscInt        start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1;
  PetscBT         table;

  PetscFunctionBegin;
  m  = A->rmap->n / bs; /* number of (block) rows */
  ai = a->i;
  aj = a->j;

  PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used");

  /* nidx collects the members of the growing set in insertion order; table marks which indices are already in it */
  PetscCall(PetscMalloc1(m + 1, &nidx));
  PetscCall(PetscBTCreate(m, &table));

  for (i = 0; i < is_max; i++) {
    /* Initialize the two local arrays */
    isz = 0;
    PetscCall(PetscBTMemzero(m, table));

    /* Extract the indices, assume there can be duplicate entries */
    PetscCall(ISGetIndices(is[i], &idx));
    PetscCall(ISGetLocalSize(is[i], &n));

    if (bs > 1) {
      /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
      for (j = 0; j < n; ++j) {
        if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs;
      }
      PetscCall(ISRestoreIndices(is[i], &idx));
      PetscCall(ISDestroy(&is[i]));

      /* k is not reset between levels, so every entry of nidx is expanded exactly once */
      k = 0;
      for (j = 0; j < ov; j++) { /* for each overlap */
        n = isz;                 /* entries appended during this level are expanded in the next one */
        for (; k < n; k++) {     /* do only those rows in nidx[k], which are not done yet */
          for (ll = 0; ll < bs; ll++) {
            row   = bs * nidx[k] + ll;
            start = ai[row];
            end   = ai[row + 1];
            for (l = start; l < end; l++) {
              val = aj[l] / bs;
              if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
            }
          }
        }
      }
      PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i)));
    } else {
      /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
      for (j = 0; j < n; ++j) {
        if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j];
      }
      PetscCall(ISRestoreIndices(is[i], &idx));
      PetscCall(ISDestroy(&is[i]));

      /* k is not reset between levels, so every entry of nidx is expanded exactly once */
      k = 0;
      for (j = 0; j < ov; j++) { /* for each overlap */
        n = isz;                 /* entries appended during this level are expanded in the next one */
        for (; k < n; k++) {     /* do only those rows in nidx[k], which are not done yet */
          row   = nidx[k];
          start = ai[row];
          end   = ai[row + 1];
          for (l = start; l < end; l++) {
            val = aj[l];
            if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
          }
        }
      }
      PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i)));
    }
  }
  PetscCall(PetscBTDestroy(&table));
  PetscCall(PetscFree(nidx));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
   MatPermute_SeqAIJ - Creates a new matrix holding A with its rows and columns permuted.

   Input Parameters:
+  A    - the matrix
.  rowp - row permutation
-  colp - column permutation

   Output Parameter:
.  B - the new matrix, created with the same type and block sizes as A

   Both permutations are inverted first; the stored entry (i, c) of A is then inserted at
   (row[i], col[c]) of *B, where row and col are the inverted permutations. Symmetry
   options are propagated from A only when rowp and colp are the same IS object.
*/
static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B)
{
  Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
  PetscInt        i, nz = 0, m = A->rmap->n, n = A->cmap->n;
  const PetscInt *row, *col;
  PetscInt       *cnew, j, *lens;
  IS              icolp, irowp;
  PetscInt       *cwork = NULL;
  PetscScalar    *vwork = NULL;

  PetscFunctionBegin;
  PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp));
  PetscCall(ISGetIndices(irowp, &row));
  PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp));
  PetscCall(ISGetIndices(icolp, &col));

  /* determine lengths of permuted rows */
  PetscCall(PetscMalloc1(m + 1, &lens));
  for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i];
  PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
  PetscCall(MatSetSizes(*B, m, n, m, n));
  PetscCall(MatSetBlockSizesFromMats(*B, A, A));
  PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
  PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens));
  PetscCall(PetscFree(lens));

  /* cnew holds the permuted column indices of one row at a time */
  PetscCall(PetscMalloc1(n, &cnew));
  for (i = 0; i < m; i++) {
    PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
    for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]];
    PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES));
    PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
  }
  PetscCall(PetscFree(cnew));

  /* flagged as unassembled ahead of the explicit assembly calls below */
  (*B)->assembled = PETSC_FALSE;

#if defined(PETSC_HAVE_DEVICE)
  PetscCall(MatBindToCPU(*B, A->boundtocpu));
#endif
  PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
  PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
  PetscCall(ISRestoreIndices(irowp, &row));
  PetscCall(ISRestoreIndices(icolp, &col));
  PetscCall(ISDestroy(&irowp));
  PetscCall(ISDestroy(&icolp));
  if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
   MatCopy_SeqAIJ - Copies the values of A into B.

   Input Parameters:
+  A   - source matrix
.  B   - destination matrix
-  str - relation between the nonzero patterns of A and B

   When str is SAME_NONZERO_PATTERN and both matrices use the same copy routine, the value
   array is copied directly after checking that both matrices store the same number of
   nonzeros. Every other case is delegated to MatCopy_Basic().
*/
PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str)
{
  PetscFunctionBegin;
  /* If the two matrices have the same copy implementation, use fast copy. */
  if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) {
    Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
    Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
    const PetscScalar *aa;

    PetscCall(MatSeqAIJGetArrayRead(A, &aa));
    /* the last entry of each row-offset array is that matrix's number of stored values */
    PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]);
    PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n]));
    PetscCall(PetscObjectStateIncrease((PetscObject)B));
    PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
  } else {
    PetscCall(MatCopy_Basic(A, B, str));
  }
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
   MatSeqAIJGetArray_SeqAIJ - Returns the pointer to the matrix's value array (a->a) in *array.
*/
PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[])
{
  Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;

  PetscFunctionBegin;
  *array = a->a;
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
   MatSeqAIJRestoreArray_SeqAIJ - Counterpart of MatSeqAIJGetArray_SeqAIJ(); only resets the
   caller's pointer to NULL. A is not touched.
*/
PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[])
{
  PetscFunctionBegin;
  *array = NULL;
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
   Computes the number of nonzeros per row needed for preallocation when X and Y
   have different nonzero structure.

   Input Parameters:
+  m      - number of rows
.  xi, xj - row offsets and column indices of X
-  yi, yj - row offsets and column indices of Y

   Output Parameter:
.  nnz - nnz[i] is the number of distinct column indices appearing in row i of X or of Y

   The count comes from a single merge pass over the two index lists of each row.
   NOTE(review): that merge is only a union count if the column indices within each row
   are ascending - presumably guaranteed by the callers, confirm.
*/
PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz)
{
  PetscInt i, j, k, nzx, nzy;

  PetscFunctionBegin;
  /* Set the number of nonzeros in the new matrix */
  for (i = 0; i < m; i++) {
    const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]);
    nzx    = xi[i + 1] - xi[i];
    nzy    = yi[i + 1] - yi[i];
    nnz[i] = 0;
    for (j = 0, k = 0; j < nzx; j++) {                  /* Point in X */
      for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */
      if (k < nzy && yjj[k] == xjj[j]) k++;             /* Skip duplicate */
      nnz[i]++;
    }
    for (; k < nzy; k++) nnz[i]++; /* entries of Y beyond the last entry of X */
  }
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
   MatAXPYGetPreallocation_SeqAIJ - Fills nnz[] with the per-row nonzero counts of the
   combined pattern of X and Y by passing their row offsets and column indices to
   MatAXPYGetPreallocation_SeqX_private(). The row count is taken from Y->rmap->N.
*/
PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz)
{
  PetscInt    m = Y->rmap->N;
  Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data;
  Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data;

  PetscFunctionBegin;
  /* Set the number of nonzeros in the new matrix */
  PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz));
  PetscFunctionReturn(PETSC_SUCCESS);
}
3032b264fe52SHong Zhang 3033d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3034d71ae5a4SJacob Faibussowitsch { 3035ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3036ac90fabeSBarry Smith 3037ac90fabeSBarry Smith PetscFunctionBegin; 3038134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3039134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3040134adf20SPierre Jolivet if (e) { 30419566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 304281fa06acSBarry Smith if (e) { 30439566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3044134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 304581fa06acSBarry Smith } 304681fa06acSBarry Smith } 304754c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 304881fa06acSBarry Smith } 3049ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30502e5835c6SStefano Zampini const PetscScalar *xa; 30512e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 305281fa06acSBarry Smith PetscBLASInt one = 1, bnz; 305381fa06acSBarry Smith 30549566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3057792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 30589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30609566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30629566063dSJacob 
Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3063ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30649566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3065ac90fabeSBarry Smith } else { 30668229c054SShri Abhyankar Mat B; 30678229c054SShri Abhyankar PetscInt *nnz; 30689566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30699566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30709566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30719566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30729566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30739566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30759566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30769566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30779bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30789566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3079ac90fabeSBarry Smith } 30803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3081ac90fabeSBarry Smith } 3082ac90fabeSBarry Smith 3083d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3084d71ae5a4SJacob Faibussowitsch { 3085354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3086354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3087354c94deSBarry Smith PetscInt i, nz; 3088354c94deSBarry Smith PetscScalar *a; 3089354c94deSBarry Smith 3090354c94deSBarry Smith PetscFunctionBegin; 3091354c94deSBarry Smith nz = aij->nz; 30929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30932205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 
30949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3095354c94deSBarry Smith #else 3096354c94deSBarry Smith PetscFunctionBegin; 3097354c94deSBarry Smith #endif 30983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3099354c94deSBarry Smith } 3100354c94deSBarry Smith 3101ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3102d71ae5a4SJacob Faibussowitsch { 3103e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3104d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3105e34fafa9SBarry Smith PetscReal atmp; 3106985db425SBarry Smith PetscScalar *x; 3107ce496241SStefano Zampini const MatScalar *aa, *av; 3108e34fafa9SBarry Smith 3109e34fafa9SBarry Smith PetscFunctionBegin; 311028b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3112ce496241SStefano Zampini aa = av; 3113e34fafa9SBarry Smith ai = a->i; 3114e34fafa9SBarry Smith aj = a->j; 3115e34fafa9SBarry Smith 31169566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31179566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31189566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 311908401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3120e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31219371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31229371c9d4SSatish Balay ai++; 3123e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3124985db425SBarry Smith atmp = PetscAbsScalar(*aa); 31259371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31269371c9d4SSatish Balay x[i] = atmp; 31279371c9d4SSatish Balay if (idx) idx[i] = *aj; 31289371c9d4SSatish Balay } 31299371c9d4SSatish Balay aa++; 31309371c9d4SSatish Balay aj++; 3131985db425SBarry Smith } 3132985db425SBarry 
Smith } 31339566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3136985db425SBarry Smith } 3137985db425SBarry Smith 3138eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v) 3139eede4a3fSMark Adams { 3140eede4a3fSMark Adams Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3141eede4a3fSMark Adams PetscInt i, j, m = A->rmap->n, *ai, ncols, n; 3142eede4a3fSMark Adams PetscScalar *x; 3143eede4a3fSMark Adams const MatScalar *aa, *av; 3144eede4a3fSMark Adams 3145eede4a3fSMark Adams PetscFunctionBegin; 3146eede4a3fSMark Adams PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3147eede4a3fSMark Adams PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3148eede4a3fSMark Adams aa = av; 3149eede4a3fSMark Adams ai = a->i; 3150eede4a3fSMark Adams 3151eede4a3fSMark Adams PetscCall(VecSet(v, 0.0)); 3152eede4a3fSMark Adams PetscCall(VecGetArrayWrite(v, &x)); 3153eede4a3fSMark Adams PetscCall(VecGetLocalSize(v, &n)); 3154eede4a3fSMark Adams PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3155eede4a3fSMark Adams for (i = 0; i < m; i++) { 3156eede4a3fSMark Adams ncols = ai[1] - ai[0]; 3157eede4a3fSMark Adams ai++; 3158eede4a3fSMark Adams for (j = 0; j < ncols; j++) { 3159eede4a3fSMark Adams x[i] += PetscAbsScalar(*aa); 3160eede4a3fSMark Adams aa++; 3161eede4a3fSMark Adams } 3162eede4a3fSMark Adams } 3163eede4a3fSMark Adams PetscCall(VecRestoreArrayWrite(v, &x)); 3164eede4a3fSMark Adams PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3165eede4a3fSMark Adams PetscFunctionReturn(PETSC_SUCCESS); 3166eede4a3fSMark Adams } 3167eede4a3fSMark Adams 3168ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3169d71ae5a4SJacob Faibussowitsch { 3170985db425SBarry Smith Mat_SeqAIJ *a 
= (Mat_SeqAIJ *)A->data; 3171d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3172985db425SBarry Smith PetscScalar *x; 3173ce496241SStefano Zampini const MatScalar *aa, *av; 3174985db425SBarry Smith 3175985db425SBarry Smith PetscFunctionBegin; 317628b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3178ce496241SStefano Zampini aa = av; 3179985db425SBarry Smith ai = a->i; 3180985db425SBarry Smith aj = a->j; 3181985db425SBarry Smith 31829566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31839566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31849566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 318508401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3186985db425SBarry Smith for (i = 0; i < m; i++) { 31879371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31889371c9d4SSatish Balay ai++; 3189d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31909371c9d4SSatish Balay x[i] = *aa; 31919371c9d4SSatish Balay if (idx) idx[i] = 0; 3192985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3193985db425SBarry Smith x[i] = 0.0; 3194985db425SBarry Smith if (idx) { 3195985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3196985db425SBarry Smith if (aj[j] > j) { 3197985db425SBarry Smith idx[i] = j; 3198985db425SBarry Smith break; 3199985db425SBarry Smith } 3200985db425SBarry Smith } 32011a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 32021a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3203985db425SBarry Smith } 3204985db425SBarry Smith } 3205985db425SBarry Smith for (j = 0; j < ncols; j++) { 32069371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) 
{ 32079371c9d4SSatish Balay x[i] = *aa; 32089371c9d4SSatish Balay if (idx) idx[i] = *aj; 32099371c9d4SSatish Balay } 32109371c9d4SSatish Balay aa++; 32119371c9d4SSatish Balay aj++; 3212985db425SBarry Smith } 3213985db425SBarry Smith } 32149566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3217985db425SBarry Smith } 3218985db425SBarry Smith 3219ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3220d71ae5a4SJacob Faibussowitsch { 3221c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3222c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3223ce496241SStefano Zampini PetscScalar *x; 3224ce496241SStefano Zampini const MatScalar *aa, *av; 3225c87e5d42SMatthew Knepley 3226c87e5d42SMatthew Knepley PetscFunctionBegin; 32279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3228ce496241SStefano Zampini aa = av; 3229c87e5d42SMatthew Knepley ai = a->i; 3230c87e5d42SMatthew Knepley aj = a->j; 3231c87e5d42SMatthew Knepley 32329566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32339566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32349566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 323508401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. 
%" PetscInt_FMT " rows", m, n); 3236c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32379371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32389371c9d4SSatish Balay ai++; 3239f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32409371c9d4SSatish Balay x[i] = *aa; 32419371c9d4SSatish Balay if (idx) idx[i] = 0; 3242f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3243f07e67edSHong Zhang x[i] = 0.0; 3244f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3245289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3246f07e67edSHong Zhang if (aj[j] > j) { 3247f07e67edSHong Zhang idx[i] = j; 32482205254eSKarl Rupp break; 32492205254eSKarl Rupp } 3250289a08f5SMatthew Knepley } 3251f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3252f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3253f07e67edSHong Zhang } 3254289a08f5SMatthew Knepley } 3255c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32569371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32579371c9d4SSatish Balay x[i] = *aa; 32589371c9d4SSatish Balay if (idx) idx[i] = *aj; 32599371c9d4SSatish Balay } 32609371c9d4SSatish Balay aa++; 32619371c9d4SSatish Balay aj++; 3262c87e5d42SMatthew Knepley } 3263c87e5d42SMatthew Knepley } 32649566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3267c87e5d42SMatthew Knepley } 3268c87e5d42SMatthew Knepley 3269ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3270d71ae5a4SJacob Faibussowitsch { 3271985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3272d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3273d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3274985db425SBarry Smith PetscScalar *x; 
3275ce496241SStefano Zampini const MatScalar *aa, *av; 3276985db425SBarry Smith 3277985db425SBarry Smith PetscFunctionBegin; 327828b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3280ce496241SStefano Zampini aa = av; 3281985db425SBarry Smith ai = a->i; 3282985db425SBarry Smith aj = a->j; 3283985db425SBarry Smith 32849566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32859566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32869566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 328708401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3288985db425SBarry Smith for (i = 0; i < m; i++) { 32899371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32909371c9d4SSatish Balay ai++; 3291d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32929371c9d4SSatish Balay x[i] = *aa; 32939371c9d4SSatish Balay if (idx) idx[i] = 0; 3294985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3295985db425SBarry Smith x[i] = 0.0; 3296985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3297985db425SBarry Smith for (j = 0; j < ncols; j++) { 3298985db425SBarry Smith if (aj[j] > j) { 3299985db425SBarry Smith idx[i] = j; 3300985db425SBarry Smith break; 3301985db425SBarry Smith } 3302985db425SBarry Smith } 3303fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3304fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3305985db425SBarry Smith } 3306985db425SBarry Smith } 3307985db425SBarry Smith for (j = 0; j < ncols; j++) { 33089371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 33099371c9d4SSatish Balay x[i] = *aa; 33109371c9d4SSatish Balay if (idx) idx[i] = *aj; 33119371c9d4SSatish Balay } 33129371c9d4SSatish Balay aa++; 
33139371c9d4SSatish Balay aj++; 3314e34fafa9SBarry Smith } 3315e34fafa9SBarry Smith } 33169566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 33179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 33183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3319e34fafa9SBarry Smith } 3320bbead8a2SBarry Smith 3321ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3322d71ae5a4SJacob Faibussowitsch { 3323bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 332433d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3325bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 33260da83c2eSBarry Smith const PetscReal shift = 0.0; 33271a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3328bbead8a2SBarry Smith 3329bbead8a2SBarry Smith PetscFunctionBegin; 3330a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33314a0d0026SBarry Smith if (a->ibdiagvalid) { 33324a0d0026SBarry Smith if (values) *values = a->ibdiag; 33333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 33344a0d0026SBarry Smith } 33359566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 33364dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3337bbead8a2SBarry Smith diag = a->ibdiag; 3338bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3339bbead8a2SBarry Smith /* factor and invert each block */ 3340bbead8a2SBarry Smith switch (bs) { 3341bbead8a2SBarry Smith case 1: 3342bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33439566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 3344ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3345ec1892c8SHong Zhang if (allowzeropivot) { 33467b6c816cSBarry Smith A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 33477b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33487b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33499566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 335098921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3351ec1892c8SHong Zhang } 3352bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3353bbead8a2SBarry Smith } 3354bbead8a2SBarry Smith break; 3355bbead8a2SBarry Smith case 2: 3356bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33579371c9d4SSatish Balay ij[0] = 2 * i; 33589371c9d4SSatish Balay ij[1] = 2 * i + 1; 33599566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33617b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3363bbead8a2SBarry Smith diag += 4; 3364bbead8a2SBarry Smith } 3365bbead8a2SBarry Smith break; 3366bbead8a2SBarry Smith case 3: 3367bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33689371c9d4SSatish Balay ij[0] = 3 * i; 33699371c9d4SSatish Balay ij[1] = 3 * i + 1; 33709371c9d4SSatish Balay ij[2] = 3 * i + 2; 33719566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33729566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 33737b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33749566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3375bbead8a2SBarry Smith diag += 9; 3376bbead8a2SBarry Smith } 3377bbead8a2SBarry Smith break; 3378bbead8a2SBarry Smith case 4: 3379bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33809371c9d4SSatish Balay ij[0] = 4 * i; 33819371c9d4SSatish Balay ij[1] = 4 * i + 1; 33829371c9d4SSatish Balay ij[2] = 4 * i + 2; 33839371c9d4SSatish Balay ij[3] = 4 * i + 3; 33849566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33859566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33867b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33879566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3388bbead8a2SBarry Smith diag += 16; 3389bbead8a2SBarry Smith } 3390bbead8a2SBarry Smith break; 3391bbead8a2SBarry Smith case 5: 3392bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33939371c9d4SSatish Balay ij[0] = 5 * i; 33949371c9d4SSatish Balay ij[1] = 5 * i + 1; 33959371c9d4SSatish Balay ij[2] = 5 * i + 2; 33969371c9d4SSatish Balay ij[3] = 5 * i + 3; 33979371c9d4SSatish Balay ij[4] = 5 * i + 4; 33989566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33999566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 34007b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34019566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3402bbead8a2SBarry Smith diag += 25; 3403bbead8a2SBarry Smith } 3404bbead8a2SBarry Smith break; 3405bbead8a2SBarry Smith case 6: 3406bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 34079371c9d4SSatish Balay ij[0] = 6 * i; 34089371c9d4SSatish Balay ij[1] = 6 * i + 1; 34099371c9d4SSatish Balay ij[2] = 6 * i + 2; 34109371c9d4SSatish Balay ij[3] = 6 * i + 3; 34119371c9d4SSatish Balay ij[4] = 
6 * i + 4; 34129371c9d4SSatish Balay ij[5] = 6 * i + 5; 34139566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 34149566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 34157b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34169566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3417bbead8a2SBarry Smith diag += 36; 3418bbead8a2SBarry Smith } 3419bbead8a2SBarry Smith break; 3420bbead8a2SBarry Smith case 7: 3421bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 34229371c9d4SSatish Balay ij[0] = 7 * i; 34239371c9d4SSatish Balay ij[1] = 7 * i + 1; 34249371c9d4SSatish Balay ij[2] = 7 * i + 2; 34259371c9d4SSatish Balay ij[3] = 7 * i + 3; 34269371c9d4SSatish Balay ij[4] = 7 * i + 4; 34279371c9d4SSatish Balay ij[5] = 7 * i + 5; 3428cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 34299566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 34309566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 34317b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34329566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3433bbead8a2SBarry Smith diag += 49; 3434bbead8a2SBarry Smith } 3435bbead8a2SBarry Smith break; 3436bbead8a2SBarry Smith default: 34379566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3438bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3439ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34409566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 34427b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 34439566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3444bbead8a2SBarry Smith diag += bs2; 3445bbead8a2SBarry Smith } 34469566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3447bbead8a2SBarry Smith } 3448bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 34493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3450bbead8a2SBarry Smith } 3451bbead8a2SBarry Smith 3452d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3453d71ae5a4SJacob Faibussowitsch { 345473a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3455fff043a9SJunchao Zhang PetscScalar a, *aa; 345673a71a0fSBarry Smith PetscInt m, n, i, j, col; 345773a71a0fSBarry Smith 345873a71a0fSBarry Smith PetscFunctionBegin; 345973a71a0fSBarry Smith if (!x->assembled) { 34609566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 346173a71a0fSBarry Smith for (i = 0; i < m; i++) { 346273a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34639566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 346473a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34659566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 346673a71a0fSBarry Smith } 346773a71a0fSBarry Smith } 3468e2ce353bSJunchao Zhang } else { 34699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34709566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3472e2ce353bSJunchao Zhang } 34739566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34749566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 347673a71a0fSBarry Smith } 347773a71a0fSBarry Smith 3478679944adSJunchao 
Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3479d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3480d71ae5a4SJacob Faibussowitsch { 3481679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3482679944adSJunchao Zhang PetscScalar a; 3483679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3484679944adSJunchao Zhang 3485679944adSJunchao Zhang PetscFunctionBegin; 3486679944adSJunchao Zhang nskip = high - low; 34879566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3488679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3489679944adSJunchao Zhang for (i = 0; i < m; i++) { 3490679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34919566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3492679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3493679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34949566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3495679944adSJunchao Zhang } 3496e2ce353bSJunchao Zhang } 34979566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34989566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3500679944adSJunchao Zhang } 3501679944adSJunchao Zhang 35020a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3503cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3504cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3505cb5b572fSBarry Smith MatMult_SeqAIJ, 350697304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 35077c922b88SBarry Smith MatMultTranspose_SeqAIJ, 35087c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3509f4259b30SLisandro Dalcin NULL, 3510f4259b30SLisandro Dalcin NULL, 
3511f4259b30SLisandro Dalcin NULL, 3512f4259b30SLisandro Dalcin /* 10*/ NULL, 3513cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3514f4259b30SLisandro Dalcin NULL, 351541f059aeSBarry Smith MatSOR_SeqAIJ, 351691e9d3e2SHong Zhang MatTranspose_SeqAIJ, 351797304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3518cb5b572fSBarry Smith MatEqual_SeqAIJ, 3519cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3520cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3521cb5b572fSBarry Smith MatNorm_SeqAIJ, 3522f4259b30SLisandro Dalcin /* 20*/ NULL, 3523cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3524cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3525cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3526d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3527f4259b30SLisandro Dalcin NULL, 3528f4259b30SLisandro Dalcin NULL, 3529f4259b30SLisandro Dalcin NULL, 3530f4259b30SLisandro Dalcin NULL, 353126cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 3532f4259b30SLisandro Dalcin NULL, 3533f4259b30SLisandro Dalcin NULL, 3534f4259b30SLisandro Dalcin NULL, 3535f4259b30SLisandro Dalcin NULL, 3536d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3537f4259b30SLisandro Dalcin NULL, 3538f4259b30SLisandro Dalcin NULL, 3539cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3540f4259b30SLisandro Dalcin NULL, 3541d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35427dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3543cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3544cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3545cb5b572fSBarry Smith MatCopy_SeqAIJ, 3546d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3547cb5b572fSBarry Smith MatScale_SeqAIJ, 35487d68702bSBarry Smith MatShift_SeqAIJ, 354979299369SBarry Smith MatDiagonalSet_SeqAIJ, 35506e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 355173a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35523b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35533b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35543b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3555a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 
355693dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3557f4259b30SLisandro Dalcin NULL, 3558f4259b30SLisandro Dalcin NULL, 3559cda55fadSBarry Smith MatPermute_SeqAIJ, 3560f4259b30SLisandro Dalcin NULL, 3561f4259b30SLisandro Dalcin /* 59*/ NULL, 3562b9b97703SBarry Smith MatDestroy_SeqAIJ, 3563b9b97703SBarry Smith MatView_SeqAIJ, 3564f4259b30SLisandro Dalcin NULL, 3565f4259b30SLisandro Dalcin NULL, 3566f4259b30SLisandro Dalcin /* 64*/ NULL, 3567321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3568f4259b30SLisandro Dalcin NULL, 3569f4259b30SLisandro Dalcin NULL, 3570f4259b30SLisandro Dalcin NULL, 3571d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3572c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3573f4259b30SLisandro Dalcin NULL, 3574f4259b30SLisandro Dalcin NULL, 3575f4259b30SLisandro Dalcin NULL, 3576f4259b30SLisandro Dalcin /* 74*/ NULL, 35773acb8795SBarry Smith MatFDColoringApply_AIJ, 3578f4259b30SLisandro Dalcin NULL, 3579f4259b30SLisandro Dalcin NULL, 3580f4259b30SLisandro Dalcin NULL, 35816ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3582f4259b30SLisandro Dalcin NULL, 3583f4259b30SLisandro Dalcin NULL, 3584f4259b30SLisandro Dalcin NULL, 3585bc011b1eSHong Zhang MatLoad_SeqAIJ, 3586d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35871cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3588f4259b30SLisandro Dalcin NULL, 3589f4259b30SLisandro Dalcin NULL, 3590f4259b30SLisandro Dalcin NULL, 3591f4259b30SLisandro Dalcin /* 89*/ NULL, 3592f4259b30SLisandro Dalcin NULL, 359326be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3594f4259b30SLisandro Dalcin NULL, 3595f4259b30SLisandro Dalcin NULL, 35968fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3597f4259b30SLisandro Dalcin NULL, 3598f4259b30SLisandro Dalcin NULL, 35996fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3600f4259b30SLisandro Dalcin NULL, 36014222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3602f4259b30SLisandro 
Dalcin NULL, 3603f4259b30SLisandro Dalcin NULL, 360487d4246cSBarry Smith MatConjugate_SeqAIJ, 3605f4259b30SLisandro Dalcin NULL, 3606d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 360799cafbc1SBarry Smith MatRealPart_SeqAIJ, 3608f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3609f4259b30SLisandro Dalcin NULL, 3610f4259b30SLisandro Dalcin NULL, 3611cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3612f4259b30SLisandro Dalcin NULL, 36132af78befSBarry Smith MatGetRowMin_SeqAIJ, 3614f4259b30SLisandro Dalcin NULL, 3615599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3616f4259b30SLisandro Dalcin /*114*/ NULL, 3617f4259b30SLisandro Dalcin NULL, 3618f4259b30SLisandro Dalcin NULL, 3619f4259b30SLisandro Dalcin NULL, 3620f4259b30SLisandro Dalcin NULL, 3621f4259b30SLisandro Dalcin /*119*/ NULL, 3622f4259b30SLisandro Dalcin NULL, 3623f4259b30SLisandro Dalcin NULL, 3624f4259b30SLisandro Dalcin NULL, 3625b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 36260716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3627a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 362837868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 36290da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3630f4259b30SLisandro Dalcin NULL, 3631f4259b30SLisandro Dalcin /*129*/ NULL, 3632f4259b30SLisandro Dalcin NULL, 3633f4259b30SLisandro Dalcin NULL, 363475648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3635b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3636b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36372b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3638f4259b30SLisandro Dalcin NULL, 3639f4259b30SLisandro Dalcin NULL, 36403964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3641f4259b30SLisandro Dalcin /*139*/ NULL, 3642f4259b30SLisandro Dalcin NULL, 3643f4259b30SLisandro Dalcin NULL, 36443a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36459c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36464222ddf1SHong Zhang 
MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36474222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3648f4259b30SLisandro Dalcin NULL, 364972833a62Smarkadams4 NULL, 365072833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36512d776b49SBarry Smith NULL, 3652dec0b466SHong Zhang /*150*/ MatTransposeSymbolic_SeqAIJ, 3653eede4a3fSMark Adams MatEliminateZeros_SeqAIJ, 3654eede4a3fSMark Adams MatGetRowSumAbs_SeqAIJ}; 365517ab2063SBarry Smith 3656ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3657d71ae5a4SJacob Faibussowitsch { 3658bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 365997f1f81fSBarry Smith PetscInt i, nz, n; 3660bef8e0ddSBarry Smith 3661bef8e0ddSBarry Smith PetscFunctionBegin; 3662bef8e0ddSBarry Smith nz = aij->maxnz; 3663d0f46423SBarry Smith n = mat->rmap->n; 3664ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3665bef8e0ddSBarry Smith aij->nz = nz; 3666ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 36673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3668bef8e0ddSBarry Smith } 3669bef8e0ddSBarry Smith 3670a3bb6f32SFande Kong /* 3671ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3672ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3673ddea5d60SJunchao Zhang */ 3674d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3675d71ae5a4SJacob Faibussowitsch { 3676a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3677eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3678eec179cfSJacob Faibussowitsch PetscHashIter tpos; 367925b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 368025b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3681a3bb6f32SFande Kong 3682a3bb6f32SFande Kong PetscFunctionBegin; 3683a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 36844f572ea9SToby Isaac PetscAssertPointer(mapping, 2); 3685a3bb6f32SFande Kong /* use a table */ 3686eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3687a3bb6f32SFande Kong ec = 0; 368825b670f0SStefano Zampini for (i = 0; i < nz; i++) { 368925b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3690eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3691a3bb6f32SFande Kong if (!data) { 3692a3bb6f32SFande Kong /* one based table */ 3693c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3694a3bb6f32SFande Kong } 3695a3bb6f32SFande Kong } 3696a3bb6f32SFande Kong /* form array of columns we need */ 36979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3698eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3699eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3700eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3701eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3702eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3703a3bb6f32SFande Kong gid--; 3704a3bb6f32SFande 
Kong lid--; 3705a3bb6f32SFande Kong garray[lid] = gid; 3706a3bb6f32SFande Kong } 37079566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3708eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3709c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3710a3bb6f32SFande Kong /* compact out the extra columns in B */ 371125b670f0SStefano Zampini for (i = 0; i < nz; i++) { 371225b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3713eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3714a3bb6f32SFande Kong lid--; 371525b670f0SStefano Zampini jj[i] = lid; 3716a3bb6f32SFande Kong } 37179566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3718eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 37199566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 37209566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 37219566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 37223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3723a3bb6f32SFande Kong } 3724a3bb6f32SFande Kong 3725bef8e0ddSBarry Smith /*@ 3726bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3727bef8e0ddSBarry Smith in the matrix. 
3728bef8e0ddSBarry Smith 3729bef8e0ddSBarry Smith Input Parameters: 373011a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3731bef8e0ddSBarry Smith - indices - the column indices 3732bef8e0ddSBarry Smith 373315091d37SBarry Smith Level: advanced 373415091d37SBarry Smith 3735bef8e0ddSBarry Smith Notes: 3736bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3737bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 373811a5261eSBarry Smith of the `MatSetValues()` operation. 3739bef8e0ddSBarry Smith 3740bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 374111a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3742bef8e0ddSBarry Smith 374311a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3744bef8e0ddSBarry Smith 3745b9617806SBarry Smith The indices should start with zero, not one. 3746b9617806SBarry Smith 37471cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ` 3748bef8e0ddSBarry Smith @*/ 3749d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3750d71ae5a4SJacob Faibussowitsch { 3751bef8e0ddSBarry Smith PetscFunctionBegin; 37520700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 37534f572ea9SToby Isaac PetscAssertPointer(indices, 2); 3754cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 37553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3756bef8e0ddSBarry Smith } 3757bef8e0ddSBarry Smith 3758ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3759d71ae5a4SJacob Faibussowitsch { 3760be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3761d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3762be6bf707SBarry Smith 3763be6bf707SBarry Smith PetscFunctionBegin; 376428b400f6SJacob Faibussowitsch 
PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3765be6bf707SBarry Smith 3766be6bf707SBarry Smith /* allocate space for values if not already there */ 37674dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3768be6bf707SBarry Smith 3769be6bf707SBarry Smith /* copy values over */ 37709566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 37713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3772be6bf707SBarry Smith } 3773be6bf707SBarry Smith 3774be6bf707SBarry Smith /*@ 377520f4b53cSBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the 3776be6bf707SBarry Smith nonlinear portion. 3777be6bf707SBarry Smith 3778c3339decSBarry Smith Logically Collect 3779be6bf707SBarry Smith 378027430b45SBarry Smith Input Parameter: 378111a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3782be6bf707SBarry Smith 378315091d37SBarry Smith Level: advanced 378415091d37SBarry Smith 37852920cce0SJacob Faibussowitsch Example Usage: 378627430b45SBarry Smith .vb 37872ef1f0ffSBarry Smith Using SNES 378827430b45SBarry Smith Create Jacobian matrix 378927430b45SBarry Smith Set linear terms into matrix 379027430b45SBarry Smith Apply boundary conditions to matrix, at this time matrix must have 379127430b45SBarry Smith final nonzero structure (i.e. 
setting the nonlinear terms and applying 379227430b45SBarry Smith boundary conditions again will not change the nonzero structure 379327430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 379427430b45SBarry Smith MatStoreValues(mat); 379527430b45SBarry Smith Call SNESSetJacobian() with matrix 379627430b45SBarry Smith In your Jacobian routine 379727430b45SBarry Smith MatRetrieveValues(mat); 379827430b45SBarry Smith Set nonlinear terms in matrix 3799be6bf707SBarry Smith 380027430b45SBarry Smith Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself: 380127430b45SBarry Smith // build linear portion of Jacobian 380227430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 380327430b45SBarry Smith MatStoreValues(mat); 380427430b45SBarry Smith loop over nonlinear iterations 380527430b45SBarry Smith MatRetrieveValues(mat); 380627430b45SBarry Smith // call MatSetValues(mat,...) to set nonliner portion of Jacobian 380727430b45SBarry Smith // call MatAssemblyBegin/End() on matrix 380827430b45SBarry Smith Solve linear system with Jacobian 380927430b45SBarry Smith endloop 381027430b45SBarry Smith .ve 3811be6bf707SBarry Smith 3812be6bf707SBarry Smith Notes: 3813da81f932SPierre Jolivet Matrix must already be assembled before calling this routine 381411a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3815be6bf707SBarry Smith calling this routine. 3816be6bf707SBarry Smith 38170c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 38180c468ba9SBarry Smith and does not allocated additional space. 
38190c468ba9SBarry Smith 3820fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()` 3821be6bf707SBarry Smith @*/ 3822d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3823d71ae5a4SJacob Faibussowitsch { 3824be6bf707SBarry Smith PetscFunctionBegin; 38250700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 382628b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 382728b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3828cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 38293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3830be6bf707SBarry Smith } 3831be6bf707SBarry Smith 3832ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3833d71ae5a4SJacob Faibussowitsch { 3834be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3835d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3836be6bf707SBarry Smith 3837be6bf707SBarry Smith PetscFunctionBegin; 383828b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 383928b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3840be6bf707SBarry Smith /* copy values over */ 38419566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 38423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3843be6bf707SBarry Smith } 3844be6bf707SBarry Smith 3845be6bf707SBarry Smith /*@ 384620f4b53cSBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()` 3847be6bf707SBarry Smith 3848c3339decSBarry Smith Logically Collect 3849be6bf707SBarry Smith 38502fe279fdSBarry Smith 
Input Parameter: 385111a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3852be6bf707SBarry Smith 385315091d37SBarry Smith Level: advanced 385415091d37SBarry Smith 38551cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()` 3856be6bf707SBarry Smith @*/ 3857d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3858d71ae5a4SJacob Faibussowitsch { 3859be6bf707SBarry Smith PetscFunctionBegin; 38600700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 386128b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 386228b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3863cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 38643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3865be6bf707SBarry Smith } 3866be6bf707SBarry Smith 386717ab2063SBarry Smith /*@C 386811a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 38690d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 387020f4b53cSBarry Smith the user should preallocate the matrix storage by setting the parameter `nz` 387120f4b53cSBarry Smith (or the array `nnz`). 387217ab2063SBarry Smith 3873d083f849SBarry Smith Collective 3874db81eaa0SLois Curfman McInnes 387517ab2063SBarry Smith Input Parameters: 387611a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 387717ab2063SBarry Smith . m - number of rows 387817ab2063SBarry Smith . n - number of columns 387917ab2063SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 388051c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38810298fd71SBarry Smith (possibly different for each row) or NULL 388217ab2063SBarry Smith 388317ab2063SBarry Smith Output Parameter: 3884416022c9SBarry Smith . A - the matrix 388517ab2063SBarry Smith 38862ef1f0ffSBarry Smith Options Database Keys: 38872ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 38882ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 38892ef1f0ffSBarry Smith 38902ef1f0ffSBarry Smith Level: intermediate 3891175b88e8SBarry Smith 3892b259b22eSLois Curfman McInnes Notes: 389377433607SBarry Smith It is recommend to use `MatCreateFromOptions()` instead of this routine 389477433607SBarry Smith 38952ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 389649a6f317SBarry Smith 38972ef1f0ffSBarry Smith The `MATSEQAIJ` format, also called 38982ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 38990002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 39002ef1f0ffSBarry Smith either one (as in Fortran) or zero. 390117ab2063SBarry Smith 390220f4b53cSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 39032ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 390420f4b53cSBarry Smith allocation. 390517ab2063SBarry Smith 3906682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 39074fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3908682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 39096c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 
39106c7ebb05SLois Curfman McInnes 39111cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 391217ab2063SBarry Smith @*/ 3913d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3914d71ae5a4SJacob Faibussowitsch { 39153a40ed3dSBarry Smith PetscFunctionBegin; 39169566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 39179566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 39189566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 39199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 39203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3921273d9f13SBarry Smith } 3922273d9f13SBarry Smith 3923273d9f13SBarry Smith /*@C 3924273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3925273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3926273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3927273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3928273d9f13SBarry Smith 3929d083f849SBarry Smith Collective 3930273d9f13SBarry Smith 3931273d9f13SBarry Smith Input Parameters: 39321c4f3114SJed Brown + B - The matrix 3933273d9f13SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 3934273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 39350298fd71SBarry Smith (possibly different for each row) or NULL 3936273d9f13SBarry Smith 39372ef1f0ffSBarry Smith Options Database Keys: 39382ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 39392ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 39402ef1f0ffSBarry Smith 39412ef1f0ffSBarry Smith Level: intermediate 39422ef1f0ffSBarry Smith 3943273d9f13SBarry Smith Notes: 39442ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 394549a6f317SBarry Smith 394611a5261eSBarry Smith The `MATSEQAIJ` format also called 39472ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 3948273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3949273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3950273d9f13SBarry Smith 39512ef1f0ffSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 39522ef1f0ffSBarry Smith Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 39532ef1f0ffSBarry Smith allocation. 3954273d9f13SBarry Smith 395511a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3956aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3957aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3958aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3959aa95bbe8SBarry Smith 396011a5261eSBarry Smith Developer Notes: 396111a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3962a96a251dSBarry Smith entries or columns indices 3963a96a251dSBarry Smith 3964273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3965273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3966273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3967273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3968273d9f13SBarry Smith 39691cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3970db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3971273d9f13SBarry Smith @*/ 3972d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3973d71ae5a4SJacob Faibussowitsch { 3974a23d5eceSKris Buschelman PetscFunctionBegin; 39756ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39766ba663aaSJed Brown PetscValidType(B, 1); 3977cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 39783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3979a23d5eceSKris Buschelman } 3980a23d5eceSKris Buschelman 3981d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3982d71ae5a4SJacob Faibussowitsch { 3983ad79cf63SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 39842576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE; 398597f1f81fSBarry Smith PetscInt i; 3986273d9f13SBarry Smith 3987273d9f13SBarry Smith PetscFunctionBegin; 3988ad79cf63SBarry Smith if (B->hash_active) { 3989aea10558SJacob Faibussowitsch B->ops[0] = 
b->cops; 3990ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3991ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3992ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3993ad79cf63SBarry Smith } 39942576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3995a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3996c461c341SBarry Smith skipallocation = PETSC_TRUE; 3997c461c341SBarry Smith nz = 0; 3998c461c341SBarry Smith } 39999566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 40009566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4001899cda47SBarry Smith 4002435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 400308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 4004cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 4005d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 400608401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 400708401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 4008b73539f3SBarry Smith } 4009b73539f3SBarry Smith } 4010b73539f3SBarry Smith 4011273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 4012ab93d7beSBarry Smith if (!skipallocation) { 40134dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 4014071fcb05SBarry Smith if (!b->ilen) { 4015071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 40169566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 4017071fcb05SBarry Smith } else { 40189566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 40192ee49352SLisandro Dalcin } 4020aa624791SPierre Jolivet if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); 4021273d9f13SBarry Smith if (!nnz) { 4022435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 4023c62bd62aSJed Brown else if (nz < 0) nz = 1; 40245d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 4025d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 4026c43c4a61SBarry Smith PetscCall(PetscIntMultError(nz, B->rmap->n, &nz)); 4027273d9f13SBarry Smith } else { 4028c73702f5SBarry Smith PetscInt64 nz64 = 0; 40299371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 40309371c9d4SSatish Balay b->imax[i] = nnz[i]; 40319371c9d4SSatish Balay nz64 += nnz[i]; 40329371c9d4SSatish Balay } 40339566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 4034273d9f13SBarry Smith } 4035ab93d7beSBarry Smith 4036273d9f13SBarry Smith /* allocate the matrix space */ 403753dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 40389566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 4039396832f4SHong Zhang if (B->structure_only) { 40409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 40419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 4042396832f4SHong Zhang } else { 40439566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 4044396832f4SHong Zhang } 4045bfeeae90SHong Zhang b->i[0] = 0; 4046ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4047396832f4SHong Zhang if (B->structure_only) { 4048396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4049396832f4SHong Zhang b->free_a = PETSC_FALSE; 4050396832f4SHong Zhang } else { 4051273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4052e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4053396832f4SHong Zhang } 4054e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4055c461c341SBarry Smith } else { 4056e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4057e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4058c461c341SBarry Smith } 4059273d9f13SBarry Smith 4060846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4061846b4da1SFande Kong /* reserve user-requested sparsity */ 40629566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4063846b4da1SFande Kong } 4064846b4da1SFande Kong 4065273d9f13SBarry Smith b->nz = 0; 4066273d9f13SBarry Smith b->maxnz = nz; 4067273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40681baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4069cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4070cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40715519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40725519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40735519a089SJose E. Roman */ 40745519a089SJose E. Roman B->nonzerostate++; 40753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4076273d9f13SBarry Smith } 4077273d9f13SBarry Smith 4078ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4079d71ae5a4SJacob Faibussowitsch { 4080846b4da1SFande Kong Mat_SeqAIJ *a; 4081a5bbaf83SFande Kong PetscInt i; 40821f14be2bSBarry Smith PetscBool skipreset; 4083846b4da1SFande Kong 4084846b4da1SFande Kong PetscFunctionBegin; 4085846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 408614d0e64fSAlex Lindsay 408714d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 40883ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 408914d0e64fSAlex Lindsay 4090846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40912c814fdeSFande Kong /* if no saved info, we error out */ 409228b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40932c814fdeSFande Kong 40941f14be2bSBarry Smith PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40952c814fdeSFande Kong 40961f14be2bSBarry Smith PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset)); 40971f14be2bSBarry Smith if (!skipreset) { 40989566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40999566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4100846b4da1SFande Kong a->i[0] = 0; 4101ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4102846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4103846b4da1SFande Kong a->nz = 0; 4104846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4105846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4106846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4107846b4da1SFande Kong A->assembled = 
PETSC_FALSE; 41081f14be2bSBarry Smith } 41093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4110846b4da1SFande Kong } 4111846b4da1SFande Kong 411258d36128SBarry Smith /*@ 411311a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4114a1661176SMatthew Knepley 4115a1661176SMatthew Knepley Input Parameters: 4116a1661176SMatthew Knepley + B - the matrix 4117*d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero) 4118*d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row 4119*d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided 4120a1661176SMatthew Knepley 4121a1661176SMatthew Knepley Level: developer 4122a1661176SMatthew Knepley 41236a9b8d82SBarry Smith Notes: 41242ef1f0ffSBarry Smith The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 412558d36128SBarry Smith 41266a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 41276a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 41286a9b8d82SBarry Smith 41296a9b8d82SBarry Smith Developer Notes: 41302ef1f0ffSBarry Smith An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and 41312ef1f0ffSBarry Smith then just copies the `v` values directly with `PetscMemcpy()`. 41326a9b8d82SBarry Smith 413311a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
41346a9b8d82SBarry Smith 4135fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()` 4136a1661176SMatthew Knepley @*/ 4137d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4138d71ae5a4SJacob Faibussowitsch { 4139a1661176SMatthew Knepley PetscFunctionBegin; 41400700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41416ba663aaSJed Brown PetscValidType(B, 1); 4142cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 41433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4144a1661176SMatthew Knepley } 4145a1661176SMatthew Knepley 4146ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4147d71ae5a4SJacob Faibussowitsch { 4148a1661176SMatthew Knepley PetscInt i; 4149a1661176SMatthew Knepley PetscInt m, n; 4150a1661176SMatthew Knepley PetscInt nz; 41516a9b8d82SBarry Smith PetscInt *nnz; 4152a1661176SMatthew Knepley 4153a1661176SMatthew Knepley PetscFunctionBegin; 4154aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4155779a8d59SSatish Balay 41569566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41579566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4158779a8d59SSatish Balay 41599566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4161a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4162b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 416308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, 
"Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4164a1661176SMatthew Knepley nnz[i] = nz; 4165a1661176SMatthew Knepley } 41669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41679566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4168a1661176SMatthew Knepley 41698e3a54c0SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES)); 4170a1661176SMatthew Knepley 41719566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41729566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4173a1661176SMatthew Knepley 41749566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 41753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4176a1661176SMatthew Knepley } 4177a1661176SMatthew Knepley 4178ad7e164aSPierre Jolivet /*@ 41792ef1f0ffSBarry Smith MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`. 4180ad7e164aSPierre Jolivet 4181ad7e164aSPierre Jolivet Input Parameters: 4182ad7e164aSPierre Jolivet + A - left-hand side matrix 4183ad7e164aSPierre Jolivet . B - right-hand side matrix 418411a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4185ad7e164aSPierre Jolivet 4186ad7e164aSPierre Jolivet Output Parameter: 41872ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B` 4188ad7e164aSPierre Jolivet 4189ad7e164aSPierre Jolivet Level: intermediate 4190ad7e164aSPierre Jolivet 419111a5261eSBarry Smith Note: 419211a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4193ad7e164aSPierre Jolivet 41941cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4195ad7e164aSPierre Jolivet @*/ 4196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4197d71ae5a4SJacob Faibussowitsch { 4198ad7e164aSPierre Jolivet PetscFunctionBegin; 4199ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4200ad7e164aSPierre Jolivet PetscValidType(A, 1); 4201ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4202ad7e164aSPierre Jolivet PetscValidType(B, 2); 42034f572ea9SToby Isaac PetscAssertPointer(C, 4); 4204ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4205ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4206ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4207ad7e164aSPierre Jolivet } 4208cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 42093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4210ad7e164aSPierre Jolivet } 4211ad7e164aSPierre Jolivet 4212ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4213d71ae5a4SJacob Faibussowitsch { 4214ad7e164aSPierre Jolivet Mat newmat; 4215ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4216ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4217ad7e164aSPierre Jolivet PetscScalar *v; 4218fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4219ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4220ad7e164aSPierre Jolivet PetscBool flg; 4221ad7e164aSPierre Jolivet 4222ad7e164aSPierre Jolivet PetscFunctionBegin; 422328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 422428b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 422528b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 422628b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 42279566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 422828b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4229aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4230ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42319566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 42329566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 42339566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 42349566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4235ad7e164aSPierre Jolivet i[0] = 0; 4236ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4237ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4238ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4239ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4240ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4241ad7e164aSPierre Jolivet } 4242ad7e164aSPierre Jolivet } 4243ad7e164aSPierre Jolivet } 42449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4245ad7e164aSPierre Jolivet *C = newmat; 42469566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4247ad7e164aSPierre Jolivet nnz = 0; 4248ad7e164aSPierre Jolivet } 42499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 
42509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4252ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4253ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4254ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4255ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4256ad7e164aSPierre Jolivet } 4257ad7e164aSPierre Jolivet } 4258ad7e164aSPierre Jolivet } 42599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 42623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4263ad7e164aSPierre Jolivet } 4264ad7e164aSPierre Jolivet 4265c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4266af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4267170fe5c8SBarry Smith 4268170fe5c8SBarry Smith /* 4269170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4270170fe5c8SBarry Smith 4271170fe5c8SBarry Smith n p p 42722da392ccSBarry Smith [ ] [ ] [ ] 42732da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42742da392ccSBarry Smith [ ] [ ] [ ] 4275170fe5c8SBarry Smith 4276170fe5c8SBarry Smith */ 4277d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4278d71ae5a4SJacob Faibussowitsch { 4279170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4280170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4281170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 428286214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4283170fe5c8SBarry Smith const PetscInt *ii, *idx; 4284170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4285170fe5c8SBarry Smith PetscScalar *c, *c_q; 428686214ceeSStefano Zampini PetscInt clda 
= sub_c->lda; 428786214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4288170fe5c8SBarry Smith 4289170fe5c8SBarry Smith PetscFunctionBegin; 4290d0f46423SBarry Smith m = A->rmap->n; 4291d0f46423SBarry Smith n = A->cmap->n; 4292d0f46423SBarry Smith p = B->cmap->n; 4293170fe5c8SBarry Smith a = sub_a->v; 4294170fe5c8SBarry Smith b = sub_b->a; 4295170fe5c8SBarry Smith c = sub_c->v; 429686214ceeSStefano Zampini if (clda == m) { 42979566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 429886214ceeSStefano Zampini } else { 429986214ceeSStefano Zampini for (j = 0; j < p; j++) 43009371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 430186214ceeSStefano Zampini } 4302170fe5c8SBarry Smith ii = sub_b->i; 4303170fe5c8SBarry Smith idx = sub_b->j; 4304170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4305170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4306170fe5c8SBarry Smith while (q-- > 0) { 430786214ceeSStefano Zampini c_q = c + clda * (*idx); 430886214ceeSStefano Zampini a_q = a + alda * i; 4309854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4310170fe5c8SBarry Smith idx++; 4311170fe5c8SBarry Smith b++; 4312170fe5c8SBarry Smith } 4313170fe5c8SBarry Smith } 43143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4315170fe5c8SBarry Smith } 4316170fe5c8SBarry Smith 4317d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4318d71ae5a4SJacob Faibussowitsch { 4319d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 432086214ceeSStefano Zampini PetscBool cisdense; 4321170fe5c8SBarry Smith 4322170fe5c8SBarry Smith PetscFunctionBegin; 432308401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 43249566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 43259566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 
4326d5e393b6SSuyash Tandon PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 432748a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 43289566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4329d73949e8SHong Zhang 43304222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 43313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4332170fe5c8SBarry Smith } 4333170fe5c8SBarry Smith 43340bad9183SKris Buschelman /*MC 4335fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43360bad9183SKris Buschelman based on compressed sparse row format. 43370bad9183SKris Buschelman 43382ef1f0ffSBarry Smith Options Database Key: 43390bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43400bad9183SKris Buschelman 43410bad9183SKris Buschelman Level: beginner 43420bad9183SKris Buschelman 43430cd7f59aSBarry Smith Notes: 43442ef1f0ffSBarry Smith `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values, 43450cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43460cd7f59aSBarry Smith in the matrix 43470cd7f59aSBarry Smith 434811a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this no 434911a5261eSBarry Smith space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored 43500cd7f59aSBarry Smith 435111a5261eSBarry Smith Developer Note: 43522ef1f0ffSBarry Smith It would be nice if all matrix formats supported passing `NULL` in for the numerical values 43530cd7f59aSBarry Smith 43541cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 43550bad9183SKris Buschelman M*/ 43560bad9183SKris Buschelman 4357ccd284c7SBarry Smith /*MC 4358ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 4359ccd284c7SBarry Smith 436011a5261eSBarry Smith This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator, 436111a5261eSBarry Smith and `MATMPIAIJ` otherwise. As a result, for single process communicators, 436211a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4363ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4364ccd284c7SBarry Smith the above preallocation routines for simplicity. 4365ccd284c7SBarry Smith 43662ef1f0ffSBarry Smith Options Database Key: 436711a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()` 4368ccd284c7SBarry Smith 43692ef1f0ffSBarry Smith Level: beginner 43702ef1f0ffSBarry Smith 437111a5261eSBarry Smith Note: 437211a5261eSBarry Smith Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when 4373ccd284c7SBarry Smith enough exist. 
4374ccd284c7SBarry Smith 43751cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4376ccd284c7SBarry Smith M*/ 4377ccd284c7SBarry Smith 4378ccd284c7SBarry Smith /*MC 4379ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4380ccd284c7SBarry Smith 43812ef1f0ffSBarry Smith Options Database Key: 43822ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 43832ef1f0ffSBarry Smith 43842ef1f0ffSBarry Smith Level: beginner 43852ef1f0ffSBarry Smith 43862ef1f0ffSBarry Smith Note: 438711a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 438811a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 438911a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4390ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4391ccd284c7SBarry Smith the above preallocation routines for simplicity. 4392ccd284c7SBarry Smith 43931cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4394ccd284c7SBarry Smith M*/ 4395ccd284c7SBarry Smith 43967906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43977906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43987906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43997906f579SHong Zhang #endif 4400d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4401d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4402d24d4204SJose E. 
Roman #endif 44037906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 44047906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 44057906f579SHong Zhang #endif 44067906f579SHong Zhang 4407d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4408c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 44094222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 44107906f579SHong Zhang 44118c778c55SBarry Smith /*@C 441211a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 44138c778c55SBarry Smith 44148c778c55SBarry Smith Not Collective 44158c778c55SBarry Smith 44168c778c55SBarry Smith Input Parameter: 4417fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44188c778c55SBarry Smith 44198c778c55SBarry Smith Output Parameter: 44208c778c55SBarry Smith . 
array - pointer to the data 44218c778c55SBarry Smith 44228c778c55SBarry Smith Level: intermediate 44238c778c55SBarry Smith 4424fe59aa6dSJacob Faibussowitsch Fortran Notes: 44250ab4885dSBarry Smith `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()` 44260ab4885dSBarry Smith 44271cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 44288c778c55SBarry Smith @*/ 4429d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4430d71ae5a4SJacob Faibussowitsch { 4431d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44328c778c55SBarry Smith 44338c778c55SBarry Smith PetscFunctionBegin; 4434d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44359566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4436d67d9f35SJunchao Zhang } else { 4437d67d9f35SJunchao Zhang *array = aij->a; 4438d67d9f35SJunchao Zhang } 44393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4440d67d9f35SJunchao Zhang } 4441d67d9f35SJunchao Zhang 4442d67d9f35SJunchao Zhang /*@C 444311a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4444d67d9f35SJunchao Zhang 4445d67d9f35SJunchao Zhang Not Collective 4446d67d9f35SJunchao Zhang 4447d67d9f35SJunchao Zhang Input Parameters: 4448fe59aa6dSJacob Faibussowitsch + A - a `MATSEQAIJ` matrix 4449d67d9f35SJunchao Zhang - array - pointer to the data 4450d67d9f35SJunchao Zhang 4451d67d9f35SJunchao Zhang Level: intermediate 4452d67d9f35SJunchao Zhang 4453fe59aa6dSJacob Faibussowitsch Fortran Notes: 44540ab4885dSBarry Smith `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()` 44550ab4885dSBarry Smith 44561cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4457d67d9f35SJunchao Zhang 
@*/ 4458d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array) 4459d71ae5a4SJacob Faibussowitsch { 4460d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4461d67d9f35SJunchao Zhang 4462d67d9f35SJunchao Zhang PetscFunctionBegin; 4463d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44649566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4465d67d9f35SJunchao Zhang } else { 4466d67d9f35SJunchao Zhang *array = NULL; 4467d67d9f35SJunchao Zhang } 44689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44699566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44718c778c55SBarry Smith } 44728c778c55SBarry Smith 447321e72a00SBarry Smith /*@C 447411a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44758f1ea47aSStefano Zampini 44760ab4885dSBarry Smith Not Collective; No Fortran Support 44778f1ea47aSStefano Zampini 44788f1ea47aSStefano Zampini Input Parameter: 4479fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44808f1ea47aSStefano Zampini 44818f1ea47aSStefano Zampini Output Parameter: 44828f1ea47aSStefano Zampini . 
array - pointer to the data 44838f1ea47aSStefano Zampini 44848f1ea47aSStefano Zampini Level: intermediate 44858f1ea47aSStefano Zampini 44861cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44878f1ea47aSStefano Zampini @*/ 4488d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4489d71ae5a4SJacob Faibussowitsch { 4490d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44918f1ea47aSStefano Zampini 44928f1ea47aSStefano Zampini PetscFunctionBegin; 4493d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44949566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4495d67d9f35SJunchao Zhang } else { 4496d67d9f35SJunchao Zhang *array = aij->a; 4497d67d9f35SJunchao Zhang } 44983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44998f1ea47aSStefano Zampini } 45008f1ea47aSStefano Zampini 45018f1ea47aSStefano Zampini /*@C 450211a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 45038f1ea47aSStefano Zampini 45040ab4885dSBarry Smith Not Collective; No Fortran Support 45058f1ea47aSStefano Zampini 45068f1ea47aSStefano Zampini Input Parameter: 4507fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 45088f1ea47aSStefano Zampini 45098f1ea47aSStefano Zampini Output Parameter: 45108f1ea47aSStefano Zampini . 
array - pointer to the data 45118f1ea47aSStefano Zampini 45128f1ea47aSStefano Zampini Level: intermediate 45138f1ea47aSStefano Zampini 45141cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45158f1ea47aSStefano Zampini @*/ 4516d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4517d71ae5a4SJacob Faibussowitsch { 4518d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 45198f1ea47aSStefano Zampini 45208f1ea47aSStefano Zampini PetscFunctionBegin; 4521d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 45229566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4523d67d9f35SJunchao Zhang } else { 4524d67d9f35SJunchao Zhang *array = NULL; 4525d67d9f35SJunchao Zhang } 45263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4527d67d9f35SJunchao Zhang } 4528d67d9f35SJunchao Zhang 4529d67d9f35SJunchao Zhang /*@C 453011a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4531d67d9f35SJunchao Zhang 45320ab4885dSBarry Smith Not Collective; No Fortran Support 4533d67d9f35SJunchao Zhang 4534d67d9f35SJunchao Zhang Input Parameter: 4535fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 4536d67d9f35SJunchao Zhang 4537d67d9f35SJunchao Zhang Output Parameter: 4538d67d9f35SJunchao Zhang . 
array - pointer to the data 4539d67d9f35SJunchao Zhang 4540d67d9f35SJunchao Zhang Level: intermediate 4541d67d9f35SJunchao Zhang 45421cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4543d67d9f35SJunchao Zhang @*/ 4544d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4545d71ae5a4SJacob Faibussowitsch { 4546d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4547d67d9f35SJunchao Zhang 4548d67d9f35SJunchao Zhang PetscFunctionBegin; 4549d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45509566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4551d67d9f35SJunchao Zhang } else { 4552d67d9f35SJunchao Zhang *array = aij->a; 4553d67d9f35SJunchao Zhang } 45549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45559566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 45563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4557d67d9f35SJunchao Zhang } 4558d67d9f35SJunchao Zhang 4559d67d9f35SJunchao Zhang /*@C 4560d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4561d67d9f35SJunchao Zhang 45620ab4885dSBarry Smith Not Collective; No Fortran Support 4563d67d9f35SJunchao Zhang 4564d67d9f35SJunchao Zhang Input Parameter: 4565fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix 4566d67d9f35SJunchao Zhang 4567d67d9f35SJunchao Zhang Output Parameter: 4568d67d9f35SJunchao Zhang . 
array - pointer to the data 4569d67d9f35SJunchao Zhang 4570d67d9f35SJunchao Zhang Level: intermediate 4571d67d9f35SJunchao Zhang 45721cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4573d67d9f35SJunchao Zhang @*/ 4574d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4575d71ae5a4SJacob Faibussowitsch { 4576d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4577d67d9f35SJunchao Zhang 4578d67d9f35SJunchao Zhang PetscFunctionBegin; 4579d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45809566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4581d67d9f35SJunchao Zhang } else { 4582d67d9f35SJunchao Zhang *array = NULL; 4583d67d9f35SJunchao Zhang } 45843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45858f1ea47aSStefano Zampini } 45868f1ea47aSStefano Zampini 45878f1ea47aSStefano Zampini /*@C 458811a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45897ee59b9bSJunchao Zhang 45900ab4885dSBarry Smith Not Collective; No Fortran Support 45917ee59b9bSJunchao Zhang 45927ee59b9bSJunchao Zhang Input Parameter: 459311a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45947ee59b9bSJunchao Zhang 45957ee59b9bSJunchao Zhang Output Parameters: 45967ee59b9bSJunchao Zhang + i - row map array of the matrix 45977ee59b9bSJunchao Zhang . j - column index array of the matrix 45987ee59b9bSJunchao Zhang . a - data array of the matrix 4599fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays 46007ee59b9bSJunchao Zhang 4601fe59aa6dSJacob Faibussowitsch Level: developer 46022ef1f0ffSBarry Smith 46037ee59b9bSJunchao Zhang Notes: 46042ef1f0ffSBarry Smith Any of the output parameters can be `NULL`, in which case the corresponding value is not returned. 46057ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. 
Otherwise, they are on the host. 46067ee59b9bSJunchao Zhang 46077ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 46082ef1f0ffSBarry Smith If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix. 46097ee59b9bSJunchao Zhang 46101cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 46117ee59b9bSJunchao Zhang @*/ 4612d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype) 4613d71ae5a4SJacob Faibussowitsch { 46147ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 46157ee59b9bSJunchao Zhang 46167ee59b9bSJunchao Zhang PetscFunctionBegin; 46177ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 46187ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 46197ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 46207ee59b9bSJunchao Zhang } else { 46217ee59b9bSJunchao Zhang if (i) *i = aij->i; 46227ee59b9bSJunchao Zhang if (j) *j = aij->j; 46237ee59b9bSJunchao Zhang if (a) *a = aij->a; 46247ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 46257ee59b9bSJunchao Zhang } 46263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 46277ee59b9bSJunchao Zhang } 46287ee59b9bSJunchao Zhang 46297ee59b9bSJunchao Zhang /*@C 463021e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 463121e72a00SBarry Smith 463221e72a00SBarry Smith Not Collective 463321e72a00SBarry Smith 463421e72a00SBarry Smith Input Parameter: 4635fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 463621e72a00SBarry Smith 463721e72a00SBarry Smith Output Parameter: 463821e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 463921e72a00SBarry Smith 464021e72a00SBarry Smith Level: intermediate 464121e72a00SBarry Smith 46421cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 464321e72a00SBarry Smith @*/ 4644d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4645d71ae5a4SJacob Faibussowitsch { 464621e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 464721e72a00SBarry Smith 464821e72a00SBarry Smith PetscFunctionBegin; 464921e72a00SBarry Smith *nz = aij->rmax; 46503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 465121e72a00SBarry Smith } 465221e72a00SBarry Smith 46532c4ab24aSJunchao Zhang static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void *data) 46542c4ab24aSJunchao Zhang { 46552c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)data; 46562c4ab24aSJunchao Zhang PetscFunctionBegin; 46572c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->perm)); 46582c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->jmap)); 46592c4ab24aSJunchao Zhang PetscCall(PetscFree(coo)); 46602c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 46612c4ab24aSJunchao Zhang } 46622c4ab24aSJunchao Zhang 4663d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4664d71ae5a4SJacob Faibussowitsch { 4665394ed5ebSJunchao Zhang MPI_Comm comm; 4666394ed5ebSJunchao Zhang PetscInt *i, *j; 46670d88f7f4SJunchao Zhang PetscInt M, N, row, iprev; 4668394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4669394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4670394ed5ebSJunchao Zhang PetscInt *Aj; 4671394ed5ebSJunchao Zhang PetscScalar *Aa; 4672cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)(mat->data); 4673cbc6b225SStefano Zampini 
MatType rtype; 4674394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 46752c4ab24aSJunchao Zhang PetscContainer container; 46762c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 46770d88f7f4SJunchao Zhang PetscBool isorted; 4678394ed5ebSJunchao Zhang 4679394ed5ebSJunchao Zhang PetscFunctionBegin; 46809566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46819566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4682e8729f6fSJunchao Zhang i = coo_i; 4683e8729f6fSJunchao Zhang j = coo_j; 46849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 46850d88f7f4SJunchao Zhang 46860d88f7f4SJunchao Zhang /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */ 46870d88f7f4SJunchao Zhang isorted = PETSC_TRUE; 46880d88f7f4SJunchao Zhang iprev = PETSC_INT_MIN; 46890d88f7f4SJunchao Zhang for (k = 0; k < coo_n; k++) { 4690394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 46910d88f7f4SJunchao Zhang if (isorted) { 46920d88f7f4SJunchao Zhang if (i[k] < iprev) isorted = PETSC_FALSE; 46930d88f7f4SJunchao Zhang else iprev = i[k]; 46940d88f7f4SJunchao Zhang } 4695394ed5ebSJunchao Zhang perm[k] = k; 4696394ed5ebSJunchao Zhang } 4697394ed5ebSJunchao Zhang 46980d88f7f4SJunchao Zhang /* Sort by row if not already */ 46990d88f7f4SJunchao Zhang if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 4700651b1cf9SStefano Zampini 4701651b1cf9SStefano Zampini /* Advance k to the first row with a non-negative index */ 4702651b1cf9SStefano Zampini for (k = 0; k < coo_n; k++) 47039371c9d4SSatish Balay if (i[k] >= 0) break; 4704394ed5ebSJunchao Zhang nneg = k; 47059566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. 
jmap[i] originally is the number of repeats for i-th nonzero */ 4706394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 470735cb6cd3SPierre Jolivet jmap++; /* Inc jmap by 1 for convenience */ 4708394ed5ebSJunchao Zhang 47099566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 47109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4711394ed5ebSJunchao Zhang 4712651b1cf9SStefano Zampini /* Support for HYPRE */ 4713651b1cf9SStefano Zampini PetscBool hypre; 4714651b1cf9SStefano Zampini const char *name; 4715651b1cf9SStefano Zampini PetscCall(PetscObjectGetName((PetscObject)mat, &name)); 4716651b1cf9SStefano Zampini PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre)); 4717651b1cf9SStefano Zampini 4718394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 471935cb6cd3SPierre Jolivet Ai++; /* Inc by 1 for convenience */ 4720394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4721394ed5ebSJunchao Zhang while (k < coo_n) { 47220d88f7f4SJunchao Zhang PetscBool strictly_sorted; // this row is strictly sorted? 
47230d88f7f4SJunchao Zhang PetscInt jprev; 47240d88f7f4SJunchao Zhang 47250d88f7f4SJunchao Zhang /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */ 4726394ed5ebSJunchao Zhang row = i[k]; 47270d88f7f4SJunchao Zhang start = k; 47280d88f7f4SJunchao Zhang jprev = PETSC_INT_MIN; 47290d88f7f4SJunchao Zhang strictly_sorted = PETSC_TRUE; 47300d88f7f4SJunchao Zhang while (k < coo_n && i[k] == row) { 47310d88f7f4SJunchao Zhang if (strictly_sorted) { 47320d88f7f4SJunchao Zhang if (j[k] <= jprev) strictly_sorted = PETSC_FALSE; 47330d88f7f4SJunchao Zhang else jprev = j[k]; 47340d88f7f4SJunchao Zhang } 47350d88f7f4SJunchao Zhang k++; 47360d88f7f4SJunchao Zhang } 4737394ed5ebSJunchao Zhang end = k; 47380d88f7f4SJunchao Zhang 4739651b1cf9SStefano Zampini /* hack for HYPRE: swap min column to diag so that diagonal values will go first */ 4740651b1cf9SStefano Zampini if (hypre) { 4741651b1cf9SStefano Zampini PetscInt minj = PETSC_MAX_INT; 4742651b1cf9SStefano Zampini PetscBool hasdiag = PETSC_FALSE; 47430d88f7f4SJunchao Zhang 47440d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to swap the first and the diag 47450d88f7f4SJunchao Zhang PetscCount tmp; 47460d88f7f4SJunchao Zhang for (p = start; p < end; p++) { 47470d88f7f4SJunchao Zhang if (j[p] == row && p != start) { 47480d88f7f4SJunchao Zhang j[p] = j[start]; 47490d88f7f4SJunchao Zhang j[start] = row; 47500d88f7f4SJunchao Zhang tmp = perm[start]; 47510d88f7f4SJunchao Zhang perm[start] = perm[p]; 47520d88f7f4SJunchao Zhang perm[p] = tmp; 47530d88f7f4SJunchao Zhang break; 47540d88f7f4SJunchao Zhang } 47550d88f7f4SJunchao Zhang } 47560d88f7f4SJunchao Zhang } else { 4757651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4758651b1cf9SStefano Zampini hasdiag = (PetscBool)(hasdiag || (j[p] == row)); 4759651b1cf9SStefano Zampini minj = PetscMin(minj, j[p]); 4760651b1cf9SStefano Zampini } 47610d88f7f4SJunchao Zhang 4762651b1cf9SStefano Zampini if (hasdiag) { 4763651b1cf9SStefano 
Zampini for (p = start; p < end; p++) { 4764651b1cf9SStefano Zampini if (j[p] == minj) j[p] = row; 4765651b1cf9SStefano Zampini else if (j[p] == row) j[p] = minj; 4766651b1cf9SStefano Zampini } 4767651b1cf9SStefano Zampini } 4768651b1cf9SStefano Zampini } 47690d88f7f4SJunchao Zhang } 47700d88f7f4SJunchao Zhang // sort by columns in a row 47710d88f7f4SJunchao Zhang if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4772651b1cf9SStefano Zampini 47730d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q 47740d88f7f4SJunchao Zhang for (p = start; p < end; p++, q++) { 47750d88f7f4SJunchao Zhang Aj[q] = j[p]; 47760d88f7f4SJunchao Zhang jmap[q] = 1; 47770d88f7f4SJunchao Zhang } 47780d88f7f4SJunchao Zhang Ai[row] = end - start; 47790d88f7f4SJunchao Zhang nnz += Ai[row]; // q is already advanced 47800d88f7f4SJunchao Zhang } else { 4781394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4782394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 4783651b1cf9SStefano Zampini jmap[q] = 1; /* Number of repeats of this nonzero entry */ 4784394ed5ebSJunchao Zhang Ai[row] = 1; 4785394ed5ebSJunchao Zhang nnz++; 4786394ed5ebSJunchao Zhang 4787394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4788394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4789394ed5ebSJunchao Zhang q++; 4790394ed5ebSJunchao Zhang jmap[q] = 1; 4791394ed5ebSJunchao Zhang Aj[q] = j[p]; 4792394ed5ebSJunchao Zhang Ai[row]++; 4793394ed5ebSJunchao Zhang nnz++; 4794394ed5ebSJunchao Zhang } else { 4795394ed5ebSJunchao Zhang jmap[q]++; 4796394ed5ebSJunchao Zhang } 4797394ed5ebSJunchao Zhang } 4798394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4799394ed5ebSJunchao Zhang } 48000d88f7f4SJunchao Zhang } 48010d88f7f4SJunchao Zhang 4802394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of 
Ai[] */ 4803394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 48040d88f7f4SJunchao Zhang jmap--; // Back to the beginning of jmap[] 4805394ed5ebSJunchao Zhang jmap[0] = 0; 4806394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 48070d88f7f4SJunchao Zhang 4808394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4809394ed5ebSJunchao Zhang PetscCount *jmap_new; 4810394ed5ebSJunchao Zhang PetscInt *Aj_new; 4811394ed5ebSJunchao Zhang 48129566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 48139566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 48149566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4815394ed5ebSJunchao Zhang jmap = jmap_new; 4816394ed5ebSJunchao Zhang 48179566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 48189566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 48199566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4820394ed5ebSJunchao Zhang Aj = Aj_new; 4821394ed5ebSJunchao Zhang } 4822394ed5ebSJunchao Zhang 4823394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4824394ed5ebSJunchao Zhang PetscCount *perm_new; 4825cbc6b225SStefano Zampini 48269566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 48279566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 48289566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4829394ed5ebSJunchao Zhang perm = perm_new; 4830394ed5ebSJunchao Zhang } 4831394ed5ebSJunchao Zhang 48329566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 48339566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 48349566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 
4835394ed5ebSJunchao Zhang 4836394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4837394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 48382c4ab24aSJunchao Zhang 48392c4ab24aSJunchao Zhang // Put the COO struct in a container and then attach that to the matrix 48402c4ab24aSJunchao Zhang PetscCall(PetscMalloc1(1, &coo)); 48412c4ab24aSJunchao Zhang coo->nz = nnz; 48422c4ab24aSJunchao Zhang coo->n = coo_n; 48432c4ab24aSJunchao Zhang coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again 48442c4ab24aSJunchao Zhang coo->jmap = jmap; // of length nnz+1 48452c4ab24aSJunchao Zhang coo->perm = perm; 48462c4ab24aSJunchao Zhang PetscCall(PetscContainerCreate(PETSC_COMM_SELF, &container)); 48472c4ab24aSJunchao Zhang PetscCall(PetscContainerSetPointer(container, coo)); 48482c4ab24aSJunchao Zhang PetscCall(PetscContainerSetUserDestroy(container, MatCOOStructDestroy_SeqAIJ)); 48492c4ab24aSJunchao Zhang PetscCall(PetscObjectCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", (PetscObject)container)); 48502c4ab24aSJunchao Zhang PetscCall(PetscContainerDestroy(&container)); 48513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4852394ed5ebSJunchao Zhang } 4853394ed5ebSJunchao Zhang 4854d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4855d71ae5a4SJacob Faibussowitsch { 4856394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4857394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 48582c4ab24aSJunchao Zhang PetscCount *perm, *jmap; 4859394ed5ebSJunchao Zhang PetscScalar *Aa; 48602c4ab24aSJunchao Zhang PetscContainer container; 48612c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 4862394ed5ebSJunchao Zhang 4863394ed5ebSJunchao Zhang PetscFunctionBegin; 48642c4ab24aSJunchao Zhang PetscCall(PetscObjectQuery((PetscObject)A, 
"__PETSc_MatCOOStruct_Host", (PetscObject *)&container)); 48652c4ab24aSJunchao Zhang PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix"); 48662c4ab24aSJunchao Zhang PetscCall(PetscContainerGetPointer(container, (void **)&coo)); 48672c4ab24aSJunchao Zhang perm = coo->perm; 48682c4ab24aSJunchao Zhang jmap = coo->jmap; 48699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4870394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4871b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4872b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4873b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4874394ed5ebSJunchao Zhang } 48759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 48763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4877394ed5ebSJunchao Zhang } 4878394ed5ebSJunchao Zhang 487934b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48805063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 488102fe1965SBarry Smith #endif 4882d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4883d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *); 4884d5e393b6SSuyash Tandon #endif 48853d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48865063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 48873d0639e7SStefano Zampini #endif 488802fe1965SBarry Smith 4889d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4890d71ae5a4SJacob Faibussowitsch { 4891273d9f13SBarry Smith Mat_SeqAIJ *b; 489238baddfdSBarry Smith PetscMPIInt size; 4893273d9f13SBarry Smith 4894273d9f13SBarry Smith PetscFunctionBegin; 48959566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 
489608401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4897273d9f13SBarry Smith 48984dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 48992205254eSKarl Rupp 4900b0a32e0cSBarry Smith B->data = (void *)b; 4901aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 4902071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 49032205254eSKarl Rupp 4904f4259b30SLisandro Dalcin b->row = NULL; 4905f4259b30SLisandro Dalcin b->col = NULL; 4906f4259b30SLisandro Dalcin b->icol = NULL; 4907b810aeb4SBarry Smith b->reallocs = 0; 490836db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4909f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4910416022c9SBarry Smith b->nonew = 0; 4911f4259b30SLisandro Dalcin b->diag = NULL; 4912f4259b30SLisandro Dalcin b->solve_work = NULL; 4913f4259b30SLisandro Dalcin B->spptr = NULL; 4914f4259b30SLisandro Dalcin b->saved_values = NULL; 4915f4259b30SLisandro Dalcin b->idiag = NULL; 4916f4259b30SLisandro Dalcin b->mdiag = NULL; 4917f4259b30SLisandro Dalcin b->ssor_work = NULL; 491871f1c65dSBarry Smith b->omega = 1.0; 491971f1c65dSBarry Smith b->fshift = 0.0; 492071f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4921bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4922a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 492317ab2063SBarry Smith 49249566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4925d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 49269566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 49279566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4928b3866ffcSBarry Smith #endif 49299566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", 
MatSeqAIJSetColumnIndices_SeqAIJ)); 49309566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 49319566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 49329566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 49339566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 49349566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 49359566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 49369779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 49379566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4938191b95cbSRichard Tran Mills #endif 493934b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 49409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 49419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 494302fe1965SBarry Smith #endif 4944d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4945d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 4946d5e393b6SSuyash Tandon 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 4947d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ)); 4948d5e393b6SSuyash Tandon #endif 49493d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 49509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 49513d0639e7SStefano Zampini #endif 49529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4953af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 49549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4955af8000cdSHong Zhang #endif 4956d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 49579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4958d24d4204SJose E. 
Roman #endif 495963c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 49609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 49619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 496263c07aadSStefano Zampini #endif 49639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 49649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 49659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 49669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 496714e4dea2SJose E. 
Roman PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ)); 49689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 49699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 49709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 49719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 49729566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 49739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 49749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 49769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 49779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 49789566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 49799566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 49809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 49813ba16761SJacob 
Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 498217ab2063SBarry Smith } 498317ab2063SBarry Smith 4984b24902e0SBarry Smith /* 49853893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4986b24902e0SBarry Smith */ 4987d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4988d71ae5a4SJacob Faibussowitsch { 49892a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4990071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 499117ab2063SBarry Smith 49923a40ed3dSBarry Smith PetscFunctionBegin; 4993aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4994273d9f13SBarry Smith 4995d5f3da31SBarry Smith C->factortype = A->factortype; 4996f4259b30SLisandro Dalcin c->row = NULL; 4997f4259b30SLisandro Dalcin c->col = NULL; 4998f4259b30SLisandro Dalcin c->icol = NULL; 49996ad4291fSHong Zhang c->reallocs = 0; 5000bc43efbbSJunchao Zhang c->diagonaldense = a->diagonaldense; 500117ab2063SBarry Smith 500269272f91SPierre Jolivet C->assembled = A->assembled; 500317ab2063SBarry Smith 500469272f91SPierre Jolivet if (A->preallocated) { 50059566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 50069566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 5007eec197d1SBarry Smith 500831fe6a7dSBarry Smith if (!A->hash_active) { 50099566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 50109566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 50119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 50129566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 501317ab2063SBarry Smith 501417ab2063SBarry Smith /* allocate the matrix space */ 
5015f77e22a1SHong Zhang if (mallocmatspace) { 50169566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 50172205254eSKarl Rupp 5018f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 50192205254eSKarl Rupp 50209566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 502117ab2063SBarry Smith if (m > 0) { 50229566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 5023be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 50242e5835c6SStefano Zampini const PetscScalar *aa; 50252e5835c6SStefano Zampini 50269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50279566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 50289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 5029be6bf707SBarry Smith } else { 50309566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 503117ab2063SBarry Smith } 503208480c60SBarry Smith } 5033f77e22a1SHong Zhang } 503431fe6a7dSBarry Smith C->preallocated = PETSC_TRUE; 503531fe6a7dSBarry Smith } else { 503631fe6a7dSBarry Smith PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix"); 503731fe6a7dSBarry Smith PetscCall(MatSetUp(C)); 503831fe6a7dSBarry Smith } 503917ab2063SBarry Smith 50406ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 5041416022c9SBarry Smith c->roworiented = a->roworiented; 5042416022c9SBarry Smith c->nonew = a->nonew; 5043416022c9SBarry Smith if (a->diag) { 50449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 50459566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 5046071fcb05SBarry Smith } else c->diag = NULL; 50472205254eSKarl Rupp 5048f4259b30SLisandro Dalcin c->solve_work = NULL; 5049f4259b30SLisandro Dalcin c->saved_values = NULL; 5050f4259b30SLisandro Dalcin c->idiag = NULL; 
5051f4259b30SLisandro Dalcin c->ssor_work = NULL; 5052a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 5053e6b907acSBarry Smith c->free_a = PETSC_TRUE; 5054e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 50556ad4291fSHong Zhang 5056893ad86cSHong Zhang c->rmax = a->rmax; 5057416022c9SBarry Smith c->nz = a->nz; 50588ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 5059754ec7b1SSatish Balay 50606ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 50616ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 5062cd6b891eSBarry Smith if (a->compressedrow.use) { 50636ad4291fSHong Zhang i = a->compressedrow.nrows; 50649566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 50659566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 50669566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 506727ea64f8SHong Zhang } else { 506827ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 50690298fd71SBarry Smith c->compressedrow.i = NULL; 50700298fd71SBarry Smith c->compressedrow.rindex = NULL; 50716ad4291fSHong Zhang } 5072ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 5073e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 50744846f1f5SKris Buschelman 50759566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 507669272f91SPierre Jolivet } 50779566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 50783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 507917ab2063SBarry Smith } 508017ab2063SBarry Smith 5081d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 5082d71ae5a4SJacob Faibussowitsch { 5083b24902e0SBarry Smith PetscFunctionBegin; 50849566063dSJacob 
Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 50859566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 508648a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 50879566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 50889566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 50893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5090b24902e0SBarry Smith } 5091b24902e0SBarry Smith 5092d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 5093d71ae5a4SJacob Faibussowitsch { 509452f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 509552f91c60SVaclav Hapla 509652f91c60SVaclav Hapla PetscFunctionBegin; 509752f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 509852f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 5099c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 51009566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 51019566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 51029566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 510352f91c60SVaclav Hapla if (isbinary) { 51049566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 510552f91c60SVaclav Hapla } else if (ishdf5) { 510652f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 51079566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 510852f91c60SVaclav Hapla #else 510952f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 511052f91c60SVaclav Hapla #endif 
511152f91c60SVaclav Hapla } else { 511298921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 511352f91c60SVaclav Hapla } 51143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 511552f91c60SVaclav Hapla } 511652f91c60SVaclav Hapla 5117d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 5118d71ae5a4SJacob Faibussowitsch { 51193ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 51203ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 5121fbdbba38SShri Abhyankar 5122fbdbba38SShri Abhyankar PetscFunctionBegin; 51239566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5124bbead8a2SBarry Smith 51253ea6fe3dSLisandro Dalcin /* read in matrix header */ 51269566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 512708401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 51289371c9d4SSatish Balay M = header[1]; 51299371c9d4SSatish Balay N = header[2]; 51309371c9d4SSatish Balay nz = header[3]; 513108401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 513208401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 513308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 5134fbdbba38SShri Abhyankar 51353ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 51369566063dSJacob Faibussowitsch 
PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 51373ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 51383ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 51393ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 51403ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 51413ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 51429566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 51439566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 51443ea6fe3dSLisandro Dalcin 51453ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 51469566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5147aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51483ea6fe3dSLisandro Dalcin 5149fbdbba38SShri Abhyankar /* read in row lengths */ 51509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 51519566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 51523ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 51539371c9d4SSatish Balay sum = 0; 51549371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 515508401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 51563ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 51579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 51589566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5159aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of 
different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51603ea6fe3dSLisandro Dalcin /* store row lengths */ 51619566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 51629566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5163fbdbba38SShri Abhyankar 51643ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 51659371c9d4SSatish Balay a->i[0] = 0; 51669371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 51673ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 51689566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 51693ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 51709566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5171fbdbba38SShri Abhyankar 51729566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 51739566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 51743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5175fbdbba38SShri Abhyankar } 5176fbdbba38SShri Abhyankar 5177d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5178d71ae5a4SJacob Faibussowitsch { 51797264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5180fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5181eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5182eeffb40dSHong Zhang PetscInt k; 5183eeffb40dSHong Zhang #endif 51847264ac53SSatish Balay 51853a40ed3dSBarry Smith PetscFunctionBegin; 5186bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5187d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5188ca44d042SBarry Smith *flg = PETSC_FALSE; 51893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 
5190bcd2baecSBarry Smith } 51917264ac53SSatish Balay 51927264ac53SSatish Balay /* if the a->i are the same */ 51939566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 51943ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 51957264ac53SSatish Balay 51967264ac53SSatish Balay /* if a->j are the same */ 51979566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 51983ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 5199bcd2baecSBarry Smith 52009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 52019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5202bcd2baecSBarry Smith /* if a->a are the same */ 5203eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5204eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5205fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5206eeffb40dSHong Zhang *flg = PETSC_FALSE; 52073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5208eeffb40dSHong Zhang } 5209eeffb40dSHong Zhang } 5210eeffb40dSHong Zhang #else 52119566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5212eeffb40dSHong Zhang #endif 52139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 52149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 52153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52167264ac53SSatish Balay } 521736db0b34SBarry Smith 521805869f15SSatish Balay /*@ 521911a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 522036db0b34SBarry Smith provided by the user. 
522136db0b34SBarry Smith 5222d083f849SBarry Smith Collective 522336db0b34SBarry Smith 522436db0b34SBarry Smith Input Parameters: 522536db0b34SBarry Smith + comm - must be an MPI communicator of size 1 522636db0b34SBarry Smith . m - number of rows 522736db0b34SBarry Smith . n - number of columns 5228483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 522936db0b34SBarry Smith . j - column indices 523036db0b34SBarry Smith - a - matrix values 523136db0b34SBarry Smith 523236db0b34SBarry Smith Output Parameter: 523336db0b34SBarry Smith . mat - the matrix 523436db0b34SBarry Smith 523536db0b34SBarry Smith Level: intermediate 523636db0b34SBarry Smith 523736db0b34SBarry Smith Notes: 52382ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 5239292fb18eSBarry Smith once the matrix is destroyed and not before 524036db0b34SBarry Smith 524136db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 524236db0b34SBarry Smith 52432ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 524436db0b34SBarry Smith 5245a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5246a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 52478eef79e4SBarry Smith as shown 52482ef1f0ffSBarry Smith .vb 52492ef1f0ffSBarry Smith 1 0 0 52502ef1f0ffSBarry Smith 2 0 3 52512ef1f0ffSBarry Smith 4 5 6 5252a4552177SSatish Balay 52532ef1f0ffSBarry Smith i = {0,1,3,6} [size = nrow+1 = 3+1] 52542ef1f0ffSBarry Smith j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 52552ef1f0ffSBarry Smith v = {1,2,3,4,5,6} [size = 6] 52562ef1f0ffSBarry Smith .ve 5257a4552177SSatish Balay 52581cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 525936db0b34SBarry Smith @*/ 5260d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5261d71ae5a4SJacob Faibussowitsch { 5262cbcfb4deSHong Zhang PetscInt ii; 526336db0b34SBarry Smith Mat_SeqAIJ *aij; 5264cbcfb4deSHong Zhang PetscInt jj; 526536db0b34SBarry Smith 526636db0b34SBarry Smith PetscFunctionBegin; 5267aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 52689566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52699566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52709566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 52719566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5273ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 52749566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 52759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5276ab93d7beSBarry Smith 527736db0b34SBarry Smith aij->i = i; 527836db0b34SBarry Smith aij->j = j; 527936db0b34SBarry Smith aij->a = a; 
528036db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 528136db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5282e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5283e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 528436db0b34SBarry Smith 5285cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 528636db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 528776bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5288aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 52899985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 529008401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 529108401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 52929985e31cSBarry Smith } 529336db0b34SBarry Smith } 529476bd3646SJed Brown } 529576bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 529636db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 529708401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5298aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 529936db0b34SBarry Smith } 530076bd3646SJed Brown } 530136db0b34SBarry Smith 
53029566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 53039566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 53043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 530536db0b34SBarry Smith } 5306cbc6b225SStefano Zampini 5307f62e3866SBarry Smith /*@ 530811a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 53098a0b0e6bSVictor Minden provided by the user. 53108a0b0e6bSVictor Minden 5311d083f849SBarry Smith Collective 53128a0b0e6bSVictor Minden 53138a0b0e6bSVictor Minden Input Parameters: 53148a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 53158a0b0e6bSVictor Minden . m - number of rows 53168a0b0e6bSVictor Minden . n - number of columns 53178a0b0e6bSVictor Minden . i - row indices 53188a0b0e6bSVictor Minden . j - column indices 53191230e6d1SVictor Minden . a - matrix values 53201230e6d1SVictor Minden . nz - number of nonzeros 53212ef1f0ffSBarry Smith - idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 53228a0b0e6bSVictor Minden 53238a0b0e6bSVictor Minden Output Parameter: 53248a0b0e6bSVictor Minden . 
mat - the matrix 53258a0b0e6bSVictor Minden 53268a0b0e6bSVictor Minden Level: intermediate 53278a0b0e6bSVictor Minden 5328f62e3866SBarry Smith Example: 5329f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 53309e99939fSJunchao Zhang .vb 53318a0b0e6bSVictor Minden 1 0 0 53328a0b0e6bSVictor Minden 2 0 3 53338a0b0e6bSVictor Minden 4 5 6 53348a0b0e6bSVictor Minden 53358a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 53368a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 53378a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 53389e99939fSJunchao Zhang .ve 5339fe59aa6dSJacob Faibussowitsch 53402ef1f0ffSBarry Smith Note: 5341d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5342d7547e51SJunchao Zhang and are particularly useful in iterative applications. 53438a0b0e6bSVictor Minden 53441cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 53458a0b0e6bSVictor Minden @*/ 5346d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5347d71ae5a4SJacob Faibussowitsch { 5348d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 53498a0b0e6bSVictor Minden 53508a0b0e6bSVictor Minden PetscFunctionBegin; 53519566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5352ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 53539566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 53549566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 53559566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 53569566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 53571230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 53581230e6d1SVictor Minden if (idx) { 53591230e6d1SVictor Minden row = i[ii] - 1; 53601230e6d1SVictor Minden col = j[ii] - 1; 53611230e6d1SVictor Minden } else { 53621230e6d1SVictor Minden row = i[ii]; 53631230e6d1SVictor Minden col = j[ii]; 53648a0b0e6bSVictor Minden } 53659566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 53668a0b0e6bSVictor Minden } 53679566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 53689566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 53699566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 53703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53718a0b0e6bSVictor Minden } 537236db0b34SBarry Smith 5373d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5374d71ae5a4SJacob Faibussowitsch { 5375acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5376acf2f550SJed Brown 5377acf2f550SJed Brown PetscFunctionBegin; 5378acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5379acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 53802205254eSKarl Rupp 53819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 53823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5383acf2f550SJed Brown } 5384acf2f550SJed Brown 5385d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5386d71ae5a4SJacob Faibussowitsch { 53879c8f2541SHong Zhang PetscFunctionBegin; 53889566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 53893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53909c8f2541SHong Zhang } 53919c8f2541SHong Zhang 539281824310SBarry Smith /* 539353dd7562SDmitry Karpeev Permute A 
into C's *local* index space using rowemb,colemb. 539453dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 539553dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 539653dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 539753dd7562SDmitry Karpeev */ 5398d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5399d71ae5a4SJacob Faibussowitsch { 540053dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 540153dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 540253dd7562SDmitry Karpeev PetscBool seqaij; 540353dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 540453dd7562SDmitry Karpeev PetscScalar v; 540553dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 540653dd7562SDmitry Karpeev 540753dd7562SDmitry Karpeev PetscFunctionBegin; 54083ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 540953dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 54109566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 541128b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 541253dd7562SDmitry Karpeev if (rowemb) { 54139566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 541408401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 541553dd7562SDmitry Karpeev } else { 541608401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 541753dd7562SDmitry Karpeev } 541853dd7562SDmitry Karpeev if (colemb) { 54199566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 542008401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 542153dd7562SDmitry Karpeev } else { 542208401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 542353dd7562SDmitry Karpeev } 542453dd7562SDmitry Karpeev 542553dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ *)(B->data); 542653dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 54279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5428ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 54299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 54309566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 543153dd7562SDmitry Karpeev } 543248a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 543353dd7562SDmitry Karpeev count = 0; 543453dd7562SDmitry Karpeev rowindices = NULL; 
543553dd7562SDmitry Karpeev colindices = NULL; 543648a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 543748a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 543853dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 543953dd7562SDmitry Karpeev PetscInt row; 544053dd7562SDmitry Karpeev row = i; 544153dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 544253dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 544353dd7562SDmitry Karpeev PetscInt col; 544453dd7562SDmitry Karpeev col = Baij->j[count]; 544553dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 544653dd7562SDmitry Karpeev v = Baij->a[count]; 54479566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 544853dd7562SDmitry Karpeev ++count; 544953dd7562SDmitry Karpeev } 545053dd7562SDmitry Karpeev } 545153dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 545253dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 545353dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 545453dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 545553dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 54563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 545753dd7562SDmitry Karpeev } 545853dd7562SDmitry Karpeev 545958c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep) 5460dec0b466SHong Zhang { 5461dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5462dec0b466SHong Zhang MatScalar *aa = a->a; 5463dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5464dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5465dec0b466SHong Zhang 5466dec0b466SHong Zhang PetscFunctionBegin; 5467dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5468dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5469dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5470dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5471dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 547258c11ad4SPierre Jolivet if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++; 5473dec0b466SHong Zhang else { 5474dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5475dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5476dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5477dec0b466SHong Zhang } 5478dec0b466SHong Zhang } 5479dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5480dec0b466SHong Zhang fshift_prev = fshift; 5481dec0b466SHong Zhang /* reset ilen and imax for each row */ 5482dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5483dec0b466SHong Zhang a->nonzerorowcnt += 
((ai[i] - fshift - ai[i - 1]) > 0); 5484dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5485dec0b466SHong Zhang } 5486312eded4SPierre Jolivet if (fshift) { 5487dec0b466SHong Zhang if (m) { 5488dec0b466SHong Zhang ai[m] -= fshift; 5489dec0b466SHong Zhang a->nz = ai[m]; 5490dec0b466SHong Zhang } 5491dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5492312eded4SPierre Jolivet A->nonzerostate++; 5493dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5494dec0b466SHong Zhang a->rmax = rmax; 5495dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5496dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5497dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5498312eded4SPierre Jolivet } 54993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5500dec0b466SHong Zhang } 5501dec0b466SHong Zhang 55024099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 55034099cc6bSBarry Smith 55044099cc6bSBarry Smith /*@C 550511a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 55064099cc6bSBarry Smith 5507c3339decSBarry Smith Collective 55084099cc6bSBarry Smith 55094099cc6bSBarry Smith Input Parameters: 55104099cc6bSBarry Smith + mat - the matrix object 55114099cc6bSBarry Smith - matype - matrix type 55124099cc6bSBarry Smith 55134099cc6bSBarry Smith Options Database Key: 55144e187271SRichard Tran Mills . 
-mat_seqaij_type <method> - for example seqaijcrl 55154099cc6bSBarry Smith 55164099cc6bSBarry Smith Level: intermediate 55174099cc6bSBarry Smith 5518fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType` 55194099cc6bSBarry Smith @*/ 5520d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5521d71ae5a4SJacob Faibussowitsch { 55224099cc6bSBarry Smith PetscBool sametype; 55235f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 55244099cc6bSBarry Smith 55254099cc6bSBarry Smith PetscFunctionBegin; 55264099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 55279566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 55283ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 55294099cc6bSBarry Smith 55309566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 55316adde796SStefano Zampini PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 55329566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 55333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55344099cc6bSBarry Smith } 55354099cc6bSBarry Smith 55364099cc6bSBarry Smith /*@C 553711a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 55384099cc6bSBarry Smith 55394099cc6bSBarry Smith Not Collective 55404099cc6bSBarry Smith 55414099cc6bSBarry Smith Input Parameters: 5542fe59aa6dSJacob Faibussowitsch + sname - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 55434099cc6bSBarry Smith - function - routine to convert to subtype 55444099cc6bSBarry Smith 55452ef1f0ffSBarry Smith Level: advanced 55462ef1f0ffSBarry Smith 55474099cc6bSBarry Smith Notes: 554811a5261eSBarry Smith `MatSeqAIJRegister()` may be 
called multiple times to add several user-defined solvers. 55494099cc6bSBarry Smith 55504099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 55514099cc6bSBarry Smith $ -mat_seqaij_type my_mat 55524099cc6bSBarry Smith 55531cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()` 55544099cc6bSBarry Smith @*/ 5555d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5556d71ae5a4SJacob Faibussowitsch { 55574099cc6bSBarry Smith PetscFunctionBegin; 55589566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 55599566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 55603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55614099cc6bSBarry Smith } 55624099cc6bSBarry Smith 55634099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 55644099cc6bSBarry Smith 55654099cc6bSBarry Smith /*@C 556611a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 55674099cc6bSBarry Smith 55684099cc6bSBarry Smith Not Collective 55694099cc6bSBarry Smith 55704099cc6bSBarry Smith Level: advanced 55714099cc6bSBarry Smith 55722ef1f0ffSBarry Smith Note: 55732ef1f0ffSBarry Smith This registers the versions of `MATSEQAIJ` for GPUs 55742ef1f0ffSBarry Smith 55751cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()` 55764099cc6bSBarry Smith @*/ 5577d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5578d71ae5a4SJacob Faibussowitsch { 55794099cc6bSBarry Smith PetscFunctionBegin; 55803ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 55814099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 55824099cc6bSBarry Smith 55839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, 
MatConvert_SeqAIJ_SeqAIJCRL)); 55849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 55859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 55869779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 55879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5588485f9817SRichard Tran Mills #endif 55895063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 55909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 55915063d097SStefano Zampini #endif 5592d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5593d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5594d5e393b6SSuyash Tandon #endif 55955063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 55969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 55975063d097SStefano Zampini #endif 55984099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 55999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 56004099cc6bSBarry Smith #endif 56013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56024099cc6bSBarry Smith } 560353dd7562SDmitry Karpeev 560453dd7562SDmitry Karpeev /* 560581824310SBarry Smith Special version for direct calls from Fortran 560681824310SBarry Smith */ 5607af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 560881824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 560981824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 561081824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 561181824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 561281824310SBarry Smith #endif 561381824310SBarry Smith 
561481824310SBarry Smith /* Change these macros so can be used in void function */ 561598921bdaSJacob Faibussowitsch 561698921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 56179566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 56189566063dSJacob Faibussowitsch #undef PetscCall 56199371c9d4SSatish Balay #define PetscCall(...) \ 56209371c9d4SSatish Balay do { \ 56215f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 562298921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 562398921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 562498921bdaSJacob Faibussowitsch return; \ 562598921bdaSJacob Faibussowitsch } \ 562698921bdaSJacob Faibussowitsch } while (0) 562798921bdaSJacob Faibussowitsch 562898921bdaSJacob Faibussowitsch #undef SETERRQ 56299371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) 
\ 56309371c9d4SSatish Balay do { \ 563198921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 563298921bdaSJacob Faibussowitsch return; \ 563398921bdaSJacob Faibussowitsch } while (0) 563481824310SBarry Smith 5635d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5636d71ae5a4SJacob Faibussowitsch { 563781824310SBarry Smith Mat A = *AA; 563881824310SBarry Smith PetscInt m = *mm, n = *nn; 563981824310SBarry Smith InsertMode is = *isis; 564081824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 564181824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 564281824310SBarry Smith PetscInt *imax, *ai, *ailen; 564381824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 564454f21887SBarry Smith MatScalar *ap, value, *aa; 5645ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5646ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 564781824310SBarry Smith 564881824310SBarry Smith PetscFunctionBegin; 56494994cf47SJed Brown MatCheckPreallocated(A, 1); 565081824310SBarry Smith imax = a->imax; 565181824310SBarry Smith ai = a->i; 565281824310SBarry Smith ailen = a->ilen; 565381824310SBarry Smith aj = a->j; 565481824310SBarry Smith aa = a->a; 565581824310SBarry Smith 565681824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 565781824310SBarry Smith row = im[k]; 565881824310SBarry Smith if (row < 0) continue; 56595f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 56609371c9d4SSatish Balay rp = aj + ai[row]; 56619371c9d4SSatish Balay ap = aa + ai[row]; 56629371c9d4SSatish Balay rmax = imax[row]; 56639371c9d4SSatish Balay nrow = ailen[row]; 566481824310SBarry 
Smith low = 0; 566581824310SBarry Smith high = nrow; 566681824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 566781824310SBarry Smith if (in[l] < 0) continue; 56685f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 566981824310SBarry Smith col = in[l]; 56702205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 56712205254eSKarl Rupp else value = v[k + l * m]; 56722205254eSKarl Rupp 567381824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 567481824310SBarry Smith 56752205254eSKarl Rupp if (col <= lastcol) low = 0; 56762205254eSKarl Rupp else high = nrow; 567781824310SBarry Smith lastcol = col; 567881824310SBarry Smith while (high - low > 5) { 567981824310SBarry Smith t = (low + high) / 2; 568081824310SBarry Smith if (rp[t] > col) high = t; 568181824310SBarry Smith else low = t; 568281824310SBarry Smith } 568381824310SBarry Smith for (i = low; i < high; i++) { 568481824310SBarry Smith if (rp[i] > col) break; 568581824310SBarry Smith if (rp[i] == col) { 568681824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 568781824310SBarry Smith else ap[i] = value; 568881824310SBarry Smith goto noinsert; 568981824310SBarry Smith } 569081824310SBarry Smith } 569181824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 569281824310SBarry Smith if (nonew == 1) goto noinsert; 56935f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5694fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 56959371c9d4SSatish Balay N = nrow++ - 1; 56969371c9d4SSatish Balay a->nz++; 56979371c9d4SSatish Balay high++; 569881824310SBarry Smith /* shift up all the later entries in this row */ 569981824310SBarry Smith for (ii = N; ii >= i; ii--) { 
570081824310SBarry Smith rp[ii + 1] = rp[ii]; 570181824310SBarry Smith ap[ii + 1] = ap[ii]; 570281824310SBarry Smith } 570381824310SBarry Smith rp[i] = col; 570481824310SBarry Smith ap[i] = value; 5705e56f5c9eSBarry Smith A->nonzerostate++; 570681824310SBarry Smith noinsert:; 570781824310SBarry Smith low = i + 1; 570881824310SBarry Smith } 570981824310SBarry Smith ailen[row] = nrow; 571081824310SBarry Smith } 571181824310SBarry Smith PetscFunctionReturnVoid(); 571281824310SBarry Smith } 571398921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 571498921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 571598921bdaSJacob Faibussowitsch * original definitions */ 57169566063dSJacob Faibussowitsch #undef PetscCall 571798921bdaSJacob Faibussowitsch #undef SETERRQ 5718