1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 20d71ae5a4SJacob Faibussowitsch { 214099cc6bSBarry Smith PetscBool flg; 224099cc6bSBarry Smith char type[256]; 234099cc6bSBarry Smith 244099cc6bSBarry Smith PetscFunctionBegin; 25d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 279566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 28d0609cedSBarry Smith PetscOptionsEnd(); 293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 304099cc6bSBarry Smith } 314099cc6bSBarry Smith 32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 33d71ae5a4SJacob Faibussowitsch { 340716a85fSBarry Smith PetscInt i, m, n; 350716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 360716a85fSBarry Smith 370716a85fSBarry Smith PetscFunctionBegin; 389566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 400716a85fSBarry Smith if (type == NORM_2) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 420716a85fSBarry Smith } else if (type == NORM_1) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_INFINITY) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 506adde796SStefano Zampini } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 53a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 54857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 560716a85fSBarry Smith } 573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 580716a85fSBarry Smith } 590716a85fSBarry Smith 60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 61d71ae5a4SJacob Faibussowitsch { 623a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 633a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 643a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 653a062f41SBarry Smith PetscInt *rows; 663a062f41SBarry Smith 673a062f41SBarry Smith PetscFunctionBegin; 683a062f41SBarry Smith for (i = 0; i < m; i++) { 69ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i = 0; i < m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 799566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 84d71ae5a4SJacob Faibussowitsch { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 86fff043a9SJunchao Zhang const MatScalar *aa; 876ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith 916ce1633cSBarry Smith PetscFunctionBegin; 929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 939566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i = 0; i < m; i++) { 96ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 976ce1633cSBarry Smith } 989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 996ce1633cSBarry Smith cnt = 0; 1006ce1633cSBarry Smith for (i = 0; i < m; i++) { 101ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1026ce1633cSBarry Smith } 103f1f41ecbSJed Brown *nrows = cnt; 104f1f41ecbSJed Brown *zrows = rows; 1059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107f1f41ecbSJed Brown } 108f1f41ecbSJed Brown 109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 110d71ae5a4SJacob Faibussowitsch { 111f1f41ecbSJed Brown PetscInt nrows, *rows; 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscFunctionBegin; 1140298fd71SBarry Smith *zrows = NULL; 1159566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1169566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1186ce1633cSBarry Smith } 1196ce1633cSBarry Smith 120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 121d71ae5a4SJacob Faibussowitsch { 122b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 123b3a44c85SBarry Smith const MatScalar *aa; 124b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 125b3a44c85SBarry Smith const PetscInt *ii; 126b3a44c85SBarry Smith PetscInt n, i, j, *rows; 127b3a44c85SBarry Smith 128b3a44c85SBarry Smith PetscFunctionBegin; 1299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 130f4259b30SLisandro Dalcin *keptrows = NULL; 131b3a44c85SBarry Smith ii = a->i; 132b3a44c85SBarry Smith for (i = 0; i < m; i++) { 133b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 134b3a44c85SBarry Smith if (!n) { 135b3a44c85SBarry Smith cnt++; 136b3a44c85SBarry Smith goto ok1; 137b3a44c85SBarry Smith } 1382e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 139b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 140b3a44c85SBarry Smith } 141b3a44c85SBarry Smith cnt++; 142b3a44c85SBarry Smith ok1:; 143b3a44c85SBarry Smith } 1442e5835c6SStefano Zampini if (!cnt) { 1459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1472e5835c6SStefano Zampini } 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 149b3a44c85SBarry Smith cnt = 0; 150b3a44c85SBarry Smith for (i = 0; i < m; i++) { 151b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 152b3a44c85SBarry Smith if (!n) continue; 1532e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 154b3a44c85SBarry Smith if (aa[j] != 0.0) { 155b3a44c85SBarry Smith rows[cnt++] = i; 156b3a44c85SBarry Smith break; 157b3a44c85SBarry Smith } 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 1609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1619566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith 165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 166d71ae5a4SJacob Faibussowitsch { 16779299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172ace3abfcSBarry Smith PetscBool missing; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 1769566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 17709f38230SBarry Smith if (!missing) { 17879299369SBarry Smith diag = aij->diag; 1799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 1809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 18179299369SBarry Smith if (is == INSERT_VALUES) { 182ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18379299369SBarry Smith } else { 184ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18579299369SBarry Smith } 1869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18979299369SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 19109f38230SBarry Smith } 1929566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19409f38230SBarry Smith } 19579299369SBarry Smith 196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 197d71ae5a4SJacob Faibussowitsch { 198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19997f1f81fSBarry Smith PetscInt i, ishift; 20017ab2063SBarry Smith 2013a40ed3dSBarry Smith PetscFunctionBegin; 202f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2033ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 204bfeeae90SHong Zhang ishift = 0; 205b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2069566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 207bfeeae90SHong Zhang } else if (oshift == 1) { 2081a83f524SJed Brown PetscInt *tia; 209d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2103b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 2121a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2131a83f524SJed Brown *ia = tia; 214ecc77c7aSBarry Smith if (ja) { 2151a83f524SJed Brown PetscInt *tja; 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 4188e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 4198e3a54c0SPierre Jolivet if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]); 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 453c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e44c0bd4SBarry Smith noinsert:; 47217ab2063SBarry Smith } 47317ab2063SBarry Smith ailen[row] = nrow; 47417ab2063SBarry Smith } 4759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47717ab2063SBarry Smith } 47817ab2063SBarry Smith 479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 480d71ae5a4SJacob Faibussowitsch { 48119b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48219b08ed1SBarry Smith PetscInt *rp, k, row; 48319b08ed1SBarry Smith PetscInt *ai = a->i; 48419b08ed1SBarry Smith PetscInt *aj = a->j; 485fff043a9SJunchao Zhang MatScalar *aa, *ap; 48619b08ed1SBarry Smith 48719b08ed1SBarry Smith PetscFunctionBegin; 48828b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48908401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 490fff043a9SJunchao Zhang 4919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49219b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49319b08ed1SBarry Smith row = im[k]; 49419b08ed1SBarry Smith rp = aj + ai[row]; 4958e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 49619b08ed1SBarry Smith 4979566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49819b08ed1SBarry Smith if (!A->structure_only) { 49919b08ed1SBarry Smith if (v) { 5009566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 50119b08ed1SBarry Smith v += n; 50219b08ed1SBarry Smith } else { 5039566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50419b08ed1SBarry Smith } 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith a->ilen[row] = n; 50719b08ed1SBarry Smith a->imax[row] = n; 50819b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50919b08ed1SBarry Smith a->nz += n; 51019b08ed1SBarry Smith } 5119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51319b08ed1SBarry Smith } 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith /*@ 51619b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 51719b08ed1SBarry Smith 51819b08ed1SBarry Smith Input Parameters: 51911a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52119b08ed1SBarry Smith 52219b08ed1SBarry Smith Level: advanced 52319b08ed1SBarry Smith 52419b08ed1SBarry Smith Notes: 52519b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52611a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52719b08ed1SBarry Smith as always with multiple matrix assemblies. 52819b08ed1SBarry Smith 5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53019b08ed1SBarry Smith @*/ 531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 532d71ae5a4SJacob Faibussowitsch { 53319b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53419b08ed1SBarry Smith 53519b08ed1SBarry Smith PetscFunctionBegin; 5369566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53819b08ed1SBarry Smith a->maxnz = nztotal; 5394dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 54019b08ed1SBarry Smith if (!a->ilen) { 5419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54219b08ed1SBarry Smith } else { 5439566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54419b08ed1SBarry Smith } 54519b08ed1SBarry Smith 54619b08ed1SBarry Smith /* allocate the matrix space */ 54719b08ed1SBarry Smith if (A->structure_only) { 5489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 55019b08ed1SBarry Smith } else { 5519566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 55219b08ed1SBarry Smith } 55319b08ed1SBarry Smith a->i[0] = 0; 55419b08ed1SBarry Smith if (A->structure_only) { 55519b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55619b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55719b08ed1SBarry Smith } else { 55819b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 55919b08ed1SBarry Smith a->free_a = PETSC_TRUE; 56019b08ed1SBarry Smith } 56119b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 56219b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 56319b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56519b08ed1SBarry Smith } 56619b08ed1SBarry Smith 567ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 568d71ae5a4SJacob Faibussowitsch { 569071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 570071fcb05SBarry Smith PetscInt *rp, k, row; 571071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 572071fcb05SBarry Smith PetscInt *aj = a->j; 573fff043a9SJunchao Zhang MatScalar *aa, *ap; 574071fcb05SBarry Smith 575071fcb05SBarry Smith PetscFunctionBegin; 5769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 577071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 578071fcb05SBarry Smith row = im[k]; 5796bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 580071fcb05SBarry Smith rp = aj + ai[row]; 581071fcb05SBarry Smith ap = aa + ai[row]; 58248a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 583071fcb05SBarry Smith if (!A->structure_only) { 584071fcb05SBarry Smith if (v) { 5859566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 586071fcb05SBarry Smith v += n; 587071fcb05SBarry Smith } else { 5889566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 589071fcb05SBarry Smith } 590071fcb05SBarry Smith } 591071fcb05SBarry Smith ailen[row] = n; 592071fcb05SBarry Smith a->nz += n; 593071fcb05SBarry Smith } 5949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 596071fcb05SBarry Smith } 597071fcb05SBarry Smith 598ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 599d71ae5a4SJacob Faibussowitsch { 6007eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 60197f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 60297f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 6034e208921SJed Brown const MatScalar *ap, *aa; 6047eb43aa7SLois Curfman McInnes 6053a40ed3dSBarry Smith PetscFunctionBegin; 6064e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6077eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6087eb43aa7SLois Curfman McInnes row = im[k]; 6099371c9d4SSatish Balay if (row < 0) { 6109371c9d4SSatish Balay v += n; 6119371c9d4SSatish Balay continue; 6129371c9d4SSatish Balay } /* negative row */ 61354c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6148e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 6158e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 6167eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6177eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6189371c9d4SSatish Balay if (in[l] < 0) { 6199371c9d4SSatish Balay v++; 6209371c9d4SSatish Balay continue; 6219371c9d4SSatish Balay } /* negative column */ 62254c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 623bfeeae90SHong Zhang col = in[l]; 6249371c9d4SSatish Balay high = nrow; 6259371c9d4SSatish Balay low = 0; /* assume unsorted */ 6267eb43aa7SLois Curfman McInnes while (high - low > 5) { 6277eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6287eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6297eb43aa7SLois Curfman McInnes else low = t; 6307eb43aa7SLois Curfman McInnes } 6317eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6327eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6337eb43aa7SLois Curfman McInnes if (rp[i] == col) { 634b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6357eb43aa7SLois Curfman McInnes goto finished; 6367eb43aa7SLois Curfman McInnes } 6377eb43aa7SLois Curfman McInnes } 63897e567efSBarry Smith *v++ = 0.0; 6397eb43aa7SLois Curfman McInnes finished:; 6407eb43aa7SLois Curfman McInnes } 6417eb43aa7SLois Curfman McInnes } 6424e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6447eb43aa7SLois Curfman McInnes } 6457eb43aa7SLois Curfman McInnes 646ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 647d71ae5a4SJacob Faibussowitsch { 6483ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 649c898d852SStefano Zampini const PetscScalar *av; 6503ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6513ea6fe3dSLisandro Dalcin PetscInt *rowlens; 65217ab2063SBarry Smith 6533a40ed3dSBarry Smith PetscFunctionBegin; 6549566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6552205254eSKarl Rupp 6563ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6573ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6583ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6593ea6fe3dSLisandro Dalcin nz = A->nz; 660416022c9SBarry Smith 6613ea6fe3dSLisandro Dalcin /* write matrix header */ 6623ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6639371c9d4SSatish Balay header[1] = M; 6649371c9d4SSatish Balay header[2] = N; 6659371c9d4SSatish Balay header[3] = nz; 6669566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 667416022c9SBarry Smith 6683ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6699566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6703ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6719566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6729566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6733ea6fe3dSLisandro Dalcin /* store column indices */ 6749566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 675416022c9SBarry Smith /* store nonzero values */ 6769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6779566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 679b37d52dbSMark F. Adams 6803ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6819566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 68317ab2063SBarry Smith } 684416022c9SBarry Smith 685d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 686d71ae5a4SJacob Faibussowitsch { 6877dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6887dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6897dc0baabSHong Zhang 6907dc0baabSHong Zhang PetscFunctionBegin; 6919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6927dc0baabSHong Zhang for (i = 0; i < m; i++) { 6939566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 69448a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6967dc0baabSHong Zhang } 6979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6997dc0baabSHong Zhang } 7007dc0baabSHong Zhang 70109573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 702cd155464SBarry Smith 703ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 704d71ae5a4SJacob Faibussowitsch { 705416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 706c898d852SStefano Zampini const PetscScalar *av; 70760e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 708e060cb09SBarry Smith const char *name; 709f3ef73ceSBarry Smith PetscViewerFormat format; 71017ab2063SBarry Smith 7113a40ed3dSBarry Smith PetscFunctionBegin; 7127dc0baabSHong Zhang if (A->structure_only) { 7139566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7157dc0baabSHong Zhang } 71643e49210SHong Zhang 7179566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7183ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 7192e5835c6SStefano Zampini 720c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 72371c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 72497f1f81fSBarry Smith PetscInt nofinalvalue = 0; 72560e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 726c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. */ 727d00d2cf4SBarry Smith nofinalvalue = 1; 728d00d2cf4SBarry Smith } 7299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 732fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 734fbfe6fa7SJed Brown #else 7359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 736fbfe6fa7SJed Brown #endif 7379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73817ab2063SBarry Smith 73917ab2063SBarry Smith for (i = 0; i < m; i++) { 74060e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 741aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 74317ab2063SBarry Smith #else 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 74517ab2063SBarry Smith #endif 74617ab2063SBarry Smith } 74717ab2063SBarry Smith } 748d00d2cf4SBarry Smith if (nofinalvalue) { 749c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 751c337ccceSJed Brown #else 7529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, A->cmap->n, 0.0)); 753c337ccceSJed Brown #endif 754d00d2cf4SBarry Smith } 7559566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 758fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 76044cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 76260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 763aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76436db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76636db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76836db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7706831982aSBarry Smith } 77144cd7ae7SLois Curfman McInnes #else 7729566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 77344cd7ae7SLois Curfman McInnes #endif 77444cd7ae7SLois Curfman McInnes } 7759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77644cd7ae7SLois Curfman McInnes } 7779566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 778fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 77997f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 782496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 783496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 78460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 785496be53dSLois Curfman McInnes if (a->j[j] >= i) { 786aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78736db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 788496be53dSLois Curfman McInnes #else 789496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 790496be53dSLois Curfman McInnes #endif 791496be53dSLois Curfman McInnes } 792496be53dSLois Curfman McInnes } 793496be53dSLois Curfman McInnes } 7942e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7962e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7972205254eSKarl Rupp if (i + 4 < m) { 7989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 7992205254eSKarl Rupp } else if (i + 3 < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 8012205254eSKarl Rupp } else if (i + 2 < m) { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 8032205254eSKarl Rupp } else if (i + 1 < m) { 8049566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 8052205254eSKarl Rupp } else if (i < m) { 8069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8072205254eSKarl Rupp } else { 8089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8092205254eSKarl Rupp } 810496be53dSLois Curfman McInnes } 8119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8129566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 813496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8159566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 816496be53dSLois Curfman McInnes } 8179566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 818496be53dSLois Curfman McInnes } 8199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 820496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 82160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 822496be53dSLois Curfman McInnes if (a->j[j] >= i) { 823aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 82448a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 825496be53dSLois Curfman McInnes #else 8269566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 827496be53dSLois Curfman McInnes #endif 828496be53dSLois Curfman McInnes } 829496be53dSLois Curfman McInnes } 8309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 831496be53dSLois Curfman McInnes } 8329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 833fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 83497f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 83587828ca2SBarry Smith PetscScalar value; 83668f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83768f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83868f1ed48SBarry Smith 83968f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 84068f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 84168f1ed48SBarry Smith realonly = PETSC_FALSE; 84268f1ed48SBarry Smith break; 84368f1ed48SBarry Smith } 84468f1ed48SBarry Smith } 84568f1ed48SBarry Smith #endif 84602594712SBarry Smith 8479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84802594712SBarry Smith for (i = 0; i < m; i++) { 84902594712SBarry Smith jcnt = 0; 850d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 851e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 85202594712SBarry Smith value = a->a[cnt++]; 853e24b481bSBarry Smith jcnt++; 85402594712SBarry Smith } else { 85502594712SBarry Smith value = 0.0; 85602594712SBarry Smith } 857aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85868f1ed48SBarry Smith if (realonly) { 8599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 86068f1ed48SBarry Smith } else { 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 86268f1ed48SBarry Smith } 86302594712SBarry Smith #else 8649566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 86502594712SBarry Smith #endif 86602594712SBarry Smith } 8679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86802594712SBarry Smith } 8699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8703c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 871150b93efSMatthew G. Knepley PetscInt fshift = 1; 8729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8733c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8753c215bfdSMatthew Knepley #else 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8773c215bfdSMatthew Knepley #endif 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8793c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 88060e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8813c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8833c215bfdSMatthew Knepley #else 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8853c215bfdSMatthew Knepley #endif 8863c215bfdSMatthew Knepley } 8873c215bfdSMatthew Knepley } 8889566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8893a40ed3dSBarry Smith } else { 8909566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 891d5f3da31SBarry Smith if (A->factortype) { 89216cd7e1dSShri Abhyankar for (i = 0; i < m; i++) { 8939566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 89416cd7e1dSShri Abhyankar /* L part */ 89560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89716cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 89916cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 90116cd7e1dSShri Abhyankar } else { 9029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 90316cd7e1dSShri Abhyankar } 90416cd7e1dSShri Abhyankar #else 9059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90616cd7e1dSShri Abhyankar #endif 90716cd7e1dSShri Abhyankar } 90816cd7e1dSShri Abhyankar /* diagonal */ 90916cd7e1dSShri Abhyankar j = a->diag[i]; 91016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 91316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 91516cd7e1dSShri Abhyankar } else { 9169566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91716cd7e1dSShri Abhyankar } 91816cd7e1dSShri Abhyankar #else 9199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 92016cd7e1dSShri Abhyankar #endif 92116cd7e1dSShri Abhyankar 92216cd7e1dSShri Abhyankar /* U part */ 92360e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 92416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 92516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9289566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 92916cd7e1dSShri Abhyankar } else { 9309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 93116cd7e1dSShri Abhyankar } 93216cd7e1dSShri Abhyankar #else 9339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 93416cd7e1dSShri Abhyankar #endif 93516cd7e1dSShri Abhyankar } 9369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93716cd7e1dSShri Abhyankar } 93816cd7e1dSShri Abhyankar } else { 93917ab2063SBarry Smith for (i = 0; i < m; i++) { 9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 94160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 942aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 94336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 9449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94536db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9473a40ed3dSBarry Smith } else { 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 94917ab2063SBarry Smith } 95017ab2063SBarry Smith #else 9519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 95217ab2063SBarry Smith #endif 95317ab2063SBarry Smith } 9549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95517ab2063SBarry Smith } 95616cd7e1dSShri Abhyankar } 9579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95817ab2063SBarry Smith } 9599566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 961416022c9SBarry Smith } 962416022c9SBarry Smith 9639804daf3SBarry Smith #include <petscdraw.h> 964ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 965d71ae5a4SJacob Faibussowitsch { 966480ef9eaSBarry Smith Mat A = (Mat)Aa; 967416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 968383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 969383922c3SLisandro Dalcin int color; 970b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 971b0a32e0cSBarry Smith PetscViewer viewer; 972f3ef73ceSBarry Smith PetscViewerFormat format; 973fff043a9SJunchao Zhang const PetscScalar *aa; 974cddf8d76SBarry Smith 9753a40ed3dSBarry Smith PetscFunctionBegin; 9769566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9779566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9789566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 979383922c3SLisandro Dalcin 980416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 982fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 983d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9840513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 985b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 986416022c9SBarry Smith for (i = 0; i < m; i++) { 9879371c9d4SSatish Balay y_l = m - i - 1.0; 9889371c9d4SSatish Balay y_r = y_l + 1.0; 989bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9909371c9d4SSatish Balay x_l = a->j[j]; 9919371c9d4SSatish Balay x_r = x_l + 1.0; 992fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9939566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 994cddf8d76SBarry Smith } 995cddf8d76SBarry Smith } 996b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 997cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9989371c9d4SSatish Balay y_l = m - i - 1.0; 9999371c9d4SSatish Balay y_r = y_l + 1.0; 1000bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10019371c9d4SSatish Balay x_l = a->j[j]; 10029371c9d4SSatish Balay x_r = x_l + 1.0; 1003fff043a9SJunchao Zhang if (aa[j] != 0.) continue; 10049566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1005cddf8d76SBarry Smith } 1006cddf8d76SBarry Smith } 1007b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1008cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10099371c9d4SSatish Balay y_l = m - i - 1.0; 10109371c9d4SSatish Balay y_r = y_l + 1.0; 1011bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10129371c9d4SSatish Balay x_l = a->j[j]; 10139371c9d4SSatish Balay x_r = x_l + 1.0; 1014fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10159566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1016416022c9SBarry Smith } 1017416022c9SBarry Smith } 1018d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10190513a670SBarry Smith } else { 10200513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10210513a670SBarry Smith /* first determine max of all nonzero values */ 1022b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1023383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1024b0a32e0cSBarry Smith PetscDraw popup; 10250513a670SBarry Smith 10260513a670SBarry Smith for (i = 0; i < nz; i++) { 1027fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10280513a670SBarry Smith } 1029383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10309566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10319566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1032383922c3SLisandro Dalcin 1033d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10340513a670SBarry Smith for (i = 0; i < m; i++) { 1035383922c3SLisandro Dalcin y_l = m - i - 1.0; 1036383922c3SLisandro Dalcin y_r = y_l + 1.0; 1037bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1038383922c3SLisandro Dalcin x_l = a->j[j]; 1039383922c3SLisandro Dalcin x_r = x_l + 1.0; 1040fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10419566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10420513a670SBarry Smith count++; 10430513a670SBarry Smith } 10440513a670SBarry Smith } 1045d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10460513a670SBarry Smith } 10479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1049480ef9eaSBarry Smith } 1050cddf8d76SBarry Smith 10519804daf3SBarry Smith #include <petscdraw.h> 1052ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1053d71ae5a4SJacob Faibussowitsch { 1054b0a32e0cSBarry Smith PetscDraw draw; 105536db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1056ace3abfcSBarry Smith PetscBool isnull; 1057480ef9eaSBarry Smith 1058480ef9eaSBarry Smith PetscFunctionBegin; 10599566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10609566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10613ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1062480ef9eaSBarry Smith 10639371c9d4SSatish Balay xr = A->cmap->n; 10649371c9d4SSatish Balay yr = A->rmap->n; 10659371c9d4SSatish Balay h = yr / 10.0; 10669371c9d4SSatish Balay w = xr / 10.0; 10679371c9d4SSatish Balay xr += w; 10689371c9d4SSatish Balay yr += h; 10699371c9d4SSatish Balay xl = -w; 10709371c9d4SSatish Balay yl = -h; 10719566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10729566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10739566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10749566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10759566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 10763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1077416022c9SBarry Smith } 1078416022c9SBarry Smith 1079d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1080d71ae5a4SJacob Faibussowitsch { 1081ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1082416022c9SBarry Smith 10833a40ed3dSBarry Smith PetscFunctionBegin; 10849566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10859566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10869566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10871baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10881baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10891baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10909566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109217ab2063SBarry Smith } 109319bcc07fSBarry Smith 1094d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1095d71ae5a4SJacob Faibussowitsch { 1096416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1097580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1098bc43efbbSJunchao Zhang PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n; 109954f21887SBarry Smith MatScalar *aa = a->a, *ap; 11003447b6efSHong Zhang PetscReal ratio = 0.6; 110117ab2063SBarry Smith 11023a40ed3dSBarry Smith PetscFunctionBegin; 11033ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 11049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1105b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1106b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11079566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1109b215bc84SStefano Zampini } 111017ab2063SBarry Smith 111143ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 111217ab2063SBarry Smith for (i = 1; i < m; i++) { 1113416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 111417ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111594a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111617ab2063SBarry Smith if (fshift) { 1117bfeeae90SHong Zhang ip = aj + ai[i]; 1118bfeeae90SHong Zhang ap = aa + ai[i]; 111917ab2063SBarry Smith N = ailen[i]; 11209566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 112148a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 112217ab2063SBarry Smith } 112317ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112417ab2063SBarry Smith } 112517ab2063SBarry Smith if (m) { 112617ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112717ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112817ab2063SBarry Smith } 112917ab2063SBarry Smith /* reset ilen and imax for each row */ 11307b083b7cSBarry Smith a->nonzerorowcnt = 0; 1131396832f4SHong Zhang if (A->structure_only) { 11329566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11339566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1134396832f4SHong Zhang } else { /* !A->structure_only */ 113517ab2063SBarry Smith for (i = 0; i < m; i++) { 113617ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11377b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113817ab2063SBarry Smith } 1139396832f4SHong Zhang } 1140bfeeae90SHong Zhang a->nz = ai[m]; 1141aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 1142bc43efbbSJunchao Zhang PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly 1143bc43efbbSJunchao Zhang a->diagonaldense = PETSC_TRUE; 1144bc43efbbSJunchao Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1145bc43efbbSJunchao Zhang for (i = 0; i < n; i++) { 1146bc43efbbSJunchao Zhang if (a->diag[i] >= ai[i + 1]) { 1147bc43efbbSJunchao Zhang a->diagonaldense = PETSC_FALSE; 1148bc43efbbSJunchao Zhang break; 1149bc43efbbSJunchao Zhang } 1150bc43efbbSJunchao Zhang } 11519566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11529566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11539566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11542205254eSKarl Rupp 11558e58a170SBarry Smith A->info.mallocs += a->reallocs; 1156dd5f02e7SSatish Balay a->reallocs = 0; 11576712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 115836db0b34SBarry Smith a->rmax = rmax; 11594e220ebcSLois Curfman McInnes 116048a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11619566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 116317ab2063SBarry Smith } 116417ab2063SBarry Smith 1165ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1166d71ae5a4SJacob Faibussowitsch { 116799cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116899cafbc1SBarry Smith PetscInt i, nz = a->nz; 11692e5835c6SStefano Zampini MatScalar *aa; 117099cafbc1SBarry Smith 117199cafbc1SBarry Smith PetscFunctionBegin; 11729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117399cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 117799cafbc1SBarry Smith } 117899cafbc1SBarry Smith 1179ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1180d71ae5a4SJacob Faibussowitsch { 118199cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 118299cafbc1SBarry Smith PetscInt i, nz = a->nz; 11832e5835c6SStefano Zampini MatScalar *aa; 118499cafbc1SBarry Smith 118599cafbc1SBarry Smith PetscFunctionBegin; 11869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 118799cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119199cafbc1SBarry Smith } 119299cafbc1SBarry Smith 1193d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1194d71ae5a4SJacob Faibussowitsch { 1195fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1196fff043a9SJunchao Zhang MatScalar *aa; 11973a40ed3dSBarry Smith 11983a40ed3dSBarry Smith PetscFunctionBegin; 11999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 12009566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 12019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 12029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 12033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120417ab2063SBarry Smith } 1205416022c9SBarry Smith 1206d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1207d71ae5a4SJacob Faibussowitsch { 1208416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1209d5d45c9bSBarry Smith 12103a40ed3dSBarry Smith PetscFunctionBegin; 1211b4e2f619SBarry Smith if (A->hash_active) { 1212e3c72094SPierre Jolivet A->ops[0] = a->cops; 1213b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 1214b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 1215b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 1216b4e2f619SBarry Smith } 1217b4e2f619SBarry Smith 12183ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 12199566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12209566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12219566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12229566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12289566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12299566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12309566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12319566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12329566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12339566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1234901853e0SKris Buschelman 12356718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12366718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12376718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12386718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12396718818eSStefano Zampini due to different matrix sizes */ 12409566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12416718818eSStefano Zampini 12429566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12432e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12442e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12512e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12522e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12532e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12542e956fe4SStefano Zampini #endif 12554222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12594222ddf1SHong Zhang #endif 1260d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1261d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1262d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1263d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1264d5e393b6SSuyash Tandon #endif 12653d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12673d0639e7SStefano Zampini #endif 12689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1269af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1271af8000cdSHong Zhang #endif 1272d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1274d24d4204SJose E. Roman #endif 127563c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 127863c07aadSStefano Zampini #endif 12799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12832e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL)); 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12942e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12952e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12962e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12972e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12982e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 12992e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 13002e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 13013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 130217ab2063SBarry Smith } 130317ab2063SBarry Smith 1304d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1305d71ae5a4SJacob Faibussowitsch { 1306416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13073a40ed3dSBarry Smith 13083a40ed3dSBarry Smith PetscFunctionBegin; 1309a65d3064SKris Buschelman switch (op) { 1310d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1311d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1312d71ae5a4SJacob Faibussowitsch break; 1313d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1314d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1315d71ae5a4SJacob Faibussowitsch break; 1316d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1317d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1318d71ae5a4SJacob Faibussowitsch break; 1319d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1320d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1321d71ae5a4SJacob Faibussowitsch break; 1322d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1323d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1324d71ae5a4SJacob Faibussowitsch break; 1325d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1326d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1327d71ae5a4SJacob Faibussowitsch break; 1328d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1329d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1330d71ae5a4SJacob Faibussowitsch break; 13313d472b54SHong Zhang case MAT_SPD: 1332b1646e73SJed Brown case MAT_SYMMETRIC: 1333b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1334b1646e73SJed Brown case MAT_HERMITIAN: 1335b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1336957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1337b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1338b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1339b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13405021d80fSJed Brown break; 13418c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1342a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1343d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1344d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1345d71ae5a4SJacob Faibussowitsch break; 1346d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1347d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1348d71ae5a4SJacob Faibussowitsch break; 1349d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1350d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1351d71ae5a4SJacob Faibussowitsch break; 1352071fcb05SBarry Smith case MAT_SORTED_FULL: 1353071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1354071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1355071fcb05SBarry Smith break; 1356d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1357d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1358d71ae5a4SJacob Faibussowitsch break; 1359d71ae5a4SJacob Faibussowitsch default: 1360d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1361a65d3064SKris Buschelman } 13623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 136317ab2063SBarry Smith } 136417ab2063SBarry Smith 1365ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1366d71ae5a4SJacob Faibussowitsch { 1367416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1368fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1369c898d852SStefano Zampini PetscScalar *x; 1370c898d852SStefano Zampini const PetscScalar *aa; 137117ab2063SBarry Smith 13723a40ed3dSBarry Smith PetscFunctionBegin; 13739566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 137408401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1376d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1377d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13789566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13792c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13809566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 138335e7444dSHong Zhang } 138435e7444dSHong Zhang 13859566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 138635e7444dSHong Zhang for (i = 0; i < n; i++) { 1387fdc842d1SBarry Smith x[i] = 0.0; 138835e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 138935e7444dSHong Zhang if (aj[j] == i) { 139035e7444dSHong Zhang x[i] = aa[j]; 139117ab2063SBarry Smith break; 139217ab2063SBarry Smith } 139317ab2063SBarry Smith } 139417ab2063SBarry Smith } 13959566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 139817ab2063SBarry Smith } 139917ab2063SBarry Smith 1400c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1401d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1402d71ae5a4SJacob Faibussowitsch { 1403416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 14045f22a7b3SSebastian Grimberg const MatScalar *aa; 1405d9ca1df4SBarry Smith PetscScalar *y; 1406d9ca1df4SBarry Smith const PetscScalar *x; 1407d0f46423SBarry Smith PetscInt m = A->rmap->n; 14085c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14095f22a7b3SSebastian Grimberg const MatScalar *v; 1410a77337e4SBarry Smith PetscScalar alpha; 1411d9ca1df4SBarry Smith PetscInt n, i, j; 1412d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14133447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1414ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14155c897100SBarry Smith #endif 141617ab2063SBarry Smith 14173a40ed3dSBarry Smith PetscFunctionBegin; 14189566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14199566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14209566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14225c897100SBarry Smith 14235c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1424fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14255c897100SBarry Smith #else 14263447b6efSHong Zhang if (usecprow) { 14273447b6efSHong Zhang m = cprow.nrows; 14283447b6efSHong Zhang ii = cprow.i; 14297b2bb3b9SHong Zhang ridx = cprow.rindex; 14303447b6efSHong Zhang } else { 14313447b6efSHong Zhang ii = a->i; 14323447b6efSHong Zhang } 143317ab2063SBarry Smith for (i = 0; i < m; i++) { 14343447b6efSHong Zhang idx = a->j + ii[i]; 1435fff043a9SJunchao Zhang v = aa + ii[i]; 14363447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14373447b6efSHong Zhang if (usecprow) { 14387b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14393447b6efSHong Zhang } else { 144017ab2063SBarry Smith alpha = x[i]; 14413447b6efSHong Zhang } 144204fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 144317ab2063SBarry Smith } 14445c897100SBarry Smith #endif 14459566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14469566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14479566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 145017ab2063SBarry Smith } 145117ab2063SBarry Smith 1452d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1453d71ae5a4SJacob Faibussowitsch { 14545c897100SBarry Smith PetscFunctionBegin; 14559566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14569566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14585c897100SBarry Smith } 14595c897100SBarry Smith 1460c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 146178b84d54SShri Abhyankar 1462d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1463d71ae5a4SJacob Faibussowitsch { 1464416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1465d9fead3dSBarry Smith PetscScalar *y; 146654f21887SBarry Smith const PetscScalar *x; 1467fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1468003131ecSBarry Smith PetscInt m = A->rmap->n; 14690298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14707b083b7cSBarry Smith PetscInt n, i; 1471362ced78SSatish Balay PetscScalar sum; 1472ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 147317ab2063SBarry Smith 1474b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 147597952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1476fee21e36SBarry Smith #endif 1477fee21e36SBarry Smith 14783a40ed3dSBarry Smith PetscFunctionBegin; 1479b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14809566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1482b215bc84SStefano Zampini } 14839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14849566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14859566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1486416022c9SBarry Smith ii = a->i; 14874eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14889566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 148997952fefSHong Zhang m = a->compressedrow.nrows; 149097952fefSHong Zhang ii = a->compressedrow.i; 149197952fefSHong Zhang ridx = a->compressedrow.rindex; 149297952fefSHong Zhang for (i = 0; i < m; i++) { 149397952fefSHong Zhang n = ii[i + 1] - ii[i]; 149497952fefSHong Zhang aj = a->j + ii[i]; 1495fff043a9SJunchao Zhang aa = a_a + ii[i]; 149697952fefSHong Zhang sum = 0.0; 1497003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1498003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 149997952fefSHong Zhang y[*ridx++] = sum; 150097952fefSHong Zhang } 150197952fefSHong Zhang } else { /* do not use compressed row format */ 1502b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15033d3eaba7SBarry Smith aj = a->j; 1504fff043a9SJunchao Zhang aa = a_a; 1505b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1506b05257ddSBarry Smith #else 150717ab2063SBarry Smith for (i = 0; i < m; i++) { 1508003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1509003131ecSBarry Smith aj = a->j + ii[i]; 1510fff043a9SJunchao Zhang aa = a_a + ii[i]; 151117ab2063SBarry Smith sum = 0.0; 1512003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 151317ab2063SBarry Smith y[i] = sum; 151417ab2063SBarry Smith } 15158d195f9aSBarry Smith #endif 1516b05257ddSBarry Smith } 15179566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15189566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15199566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 152217ab2063SBarry Smith } 152317ab2063SBarry Smith 1524ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1525ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1526d71ae5a4SJacob Faibussowitsch { 1527b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1528b434eb95SMatthew G. Knepley PetscScalar *y; 1529b434eb95SMatthew G. Knepley const PetscScalar *x; 1530fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1531b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1532b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1533b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1534b434eb95SMatthew G. Knepley PetscScalar sum; 1535b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1536b434eb95SMatthew G. Knepley 1537b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1538b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1539b434eb95SMatthew G. Knepley #endif 1540b434eb95SMatthew G. Knepley 1541b434eb95SMatthew G. Knepley PetscFunctionBegin; 15429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15439566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15449566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1545b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1546b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1547b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1548b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1549b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1550b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1551b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1552fff043a9SJunchao Zhang aa = a_a + ii[i]; 1553b434eb95SMatthew G. Knepley sum = 0.0; 1554b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1555b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1556b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1557b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1558b434eb95SMatthew G. Knepley } 1559b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15603d3eaba7SBarry Smith ii = a->i; 1561b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1562b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1563b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1564fff043a9SJunchao Zhang aa = a_a + ii[i]; 1565b434eb95SMatthew G. Knepley sum = 0.0; 1566b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1567b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1568b434eb95SMatthew G. Knepley y[i] = sum; 1569b434eb95SMatthew G. Knepley } 1570b434eb95SMatthew G. Knepley } 15719566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15729566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15739566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1576b434eb95SMatthew G. Knepley } 1577b434eb95SMatthew G. Knepley 1578ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1579ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1580d71ae5a4SJacob Faibussowitsch { 1581b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1582b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1583b434eb95SMatthew G. Knepley const PetscScalar *x; 1584fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1585b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1586b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1587b434eb95SMatthew G. Knepley PetscScalar sum; 1588b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1589b434eb95SMatthew G. Knepley 1590b434eb95SMatthew G. Knepley PetscFunctionBegin; 15919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15929566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15939566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1594b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 159548a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1596b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1597b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1598b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1599b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1600b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1601b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1602fff043a9SJunchao Zhang aa = a_a + ii[i]; 1603b434eb95SMatthew G. Knepley sum = y[*ridx]; 1604b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1605b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1606b434eb95SMatthew G. Knepley } 1607b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16083d3eaba7SBarry Smith ii = a->i; 1609b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1610b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1611b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1612fff043a9SJunchao Zhang aa = a_a + ii[i]; 1613b434eb95SMatthew G. Knepley sum = y[i]; 1614b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1615b434eb95SMatthew G. Knepley z[i] = sum; 1616b434eb95SMatthew G. Knepley } 1617b434eb95SMatthew G. Knepley } 16189566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16209566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1623b434eb95SMatthew G. Knepley } 1624b434eb95SMatthew G. Knepley 1625c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1626d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1627d71ae5a4SJacob Faibussowitsch { 1628416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1629f15663dcSBarry Smith PetscScalar *y, *z; 1630f15663dcSBarry Smith const PetscScalar *x; 1631fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1632d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1633d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1634362ced78SSatish Balay PetscScalar sum; 1635ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16369ea0dfa2SSatish Balay 16373a40ed3dSBarry Smith PetscFunctionBegin; 1638b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16399566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1641b215bc84SStefano Zampini } 16429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16439566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16449566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16454eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 164648a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 164797952fefSHong Zhang m = a->compressedrow.nrows; 164897952fefSHong Zhang ii = a->compressedrow.i; 164997952fefSHong Zhang ridx = a->compressedrow.rindex; 165097952fefSHong Zhang for (i = 0; i < m; i++) { 165197952fefSHong Zhang n = ii[i + 1] - ii[i]; 165297952fefSHong Zhang aj = a->j + ii[i]; 1653fff043a9SJunchao Zhang aa = a_a + ii[i]; 165497952fefSHong Zhang sum = y[*ridx]; 1655f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165697952fefSHong Zhang z[*ridx++] = sum; 165797952fefSHong Zhang } 165897952fefSHong Zhang } else { /* do not use compressed row format */ 16593d3eaba7SBarry Smith ii = a->i; 1660f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16613d3eaba7SBarry Smith aj = a->j; 1662fff043a9SJunchao Zhang aa = a_a; 1663f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1664f15663dcSBarry Smith #else 166517ab2063SBarry Smith for (i = 0; i < m; i++) { 1666f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1667f15663dcSBarry Smith aj = a->j + ii[i]; 1668fff043a9SJunchao Zhang aa = a_a + ii[i]; 166917ab2063SBarry Smith sum = y[i]; 1670f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 167117ab2063SBarry Smith z[i] = sum; 167217ab2063SBarry Smith } 167302ab625aSSatish Balay #endif 1674f15663dcSBarry Smith } 16759566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16769566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16779566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 168017ab2063SBarry Smith } 168117ab2063SBarry Smith 168217ab2063SBarry Smith /* 168317ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 168417ab2063SBarry Smith */ 1685d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1686d71ae5a4SJacob Faibussowitsch { 1687416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1688d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1689c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 169017ab2063SBarry Smith 16913a40ed3dSBarry Smith PetscFunctionBegin; 169209f38230SBarry Smith if (!a->diag) { 16939566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1694c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 169509f38230SBarry Smith } 1696d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1697c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1698c0c07093SJunchao Zhang if (alreadySet) { 1699c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1700c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1701c0c07093SJunchao Zhang } 1702c0c07093SJunchao Zhang 170309f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1704bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1705bfeeae90SHong Zhang if (a->j[j] == i) { 170609f38230SBarry Smith a->diag[i] = j; 170717ab2063SBarry Smith break; 170817ab2063SBarry Smith } 170917ab2063SBarry Smith } 171017ab2063SBarry Smith } 17113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 171217ab2063SBarry Smith } 171317ab2063SBarry Smith 1714ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1715d71ae5a4SJacob Faibussowitsch { 171661ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 171761ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 171861ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 171961ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 172061ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 172161ecd0c6SBarry Smith 172261ecd0c6SBarry Smith PetscFunctionBegin; 172361ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17259566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 17263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 172761ecd0c6SBarry Smith } 172861ecd0c6SBarry Smith 172961ecd0c6SBarry Smith if (a->diagonaldense) { 173061ecd0c6SBarry Smith cnt = 0; 173161ecd0c6SBarry Smith } else { 17329566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 173361ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1734349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 173561ecd0c6SBarry Smith cnt++; 173661ecd0c6SBarry Smith mdiag[i] = 1; 173761ecd0c6SBarry Smith } 173861ecd0c6SBarry Smith } 173961ecd0c6SBarry Smith } 174061ecd0c6SBarry Smith if (!cnt) { 17419566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 174261ecd0c6SBarry Smith } else { 1743b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1744b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 174561ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 17466ea2a7edSJunchao Zhang const PetscScalar *Aa; 17476ea2a7edSJunchao Zhang 17486ea2a7edSJunchao Zhang PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host 17496ea2a7edSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa)); 175061ecd0c6SBarry Smith 175161ecd0c6SBarry Smith a->a = NULL; 175261ecd0c6SBarry Smith a->j = NULL; 175361ecd0c6SBarry Smith a->i = NULL; 175461ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1755ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 175761ecd0c6SBarry Smith 175861ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 175961ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17609566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 176148a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1762447d62f5SStefano Zampini } 17639566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17649566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 176561ecd0c6SBarry Smith if (singlemalloc) { 17669566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 176761ecd0c6SBarry Smith } else { 17689566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17699566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17709566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 177161ecd0c6SBarry Smith } 177261ecd0c6SBarry Smith } 17739566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 177461ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 17753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 177661ecd0c6SBarry Smith } 177761ecd0c6SBarry Smith 1778be5855fcSBarry Smith /* 1779be5855fcSBarry Smith Checks for missing diagonals 1780be5855fcSBarry Smith */ 1781d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1782d71ae5a4SJacob Faibussowitsch { 1783be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17847734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1785be5855fcSBarry Smith 1786be5855fcSBarry Smith PetscFunctionBegin; 178709f38230SBarry Smith *missing = PETSC_FALSE; 17887734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 178909f38230SBarry Smith *missing = PETSC_TRUE; 179009f38230SBarry Smith if (d) *d = 0; 17919566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 179209f38230SBarry Smith } else { 179301445905SHong Zhang PetscInt n; 179401445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1795f1e2ffcdSBarry Smith diag = a->diag; 179601445905SHong Zhang for (i = 0; i < n; i++) { 17977734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 179809f38230SBarry Smith *missing = PETSC_TRUE; 179909f38230SBarry Smith if (d) *d = i; 18009566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1801358d2f5dSShri Abhyankar break; 180209f38230SBarry Smith } 1803be5855fcSBarry Smith } 1804be5855fcSBarry Smith } 18053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1806be5855fcSBarry Smith } 1807be5855fcSBarry Smith 18080da83c2eSBarry Smith #include <petscblaslapack.h> 18090da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18100da83c2eSBarry Smith 18110da83c2eSBarry Smith /* 18120da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18130da83c2eSBarry Smith */ 1814ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1815d71ae5a4SJacob Faibussowitsch { 18160da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18170da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18180da83c2eSBarry Smith const PetscReal shift = 0.0; 18190da83c2eSBarry Smith PetscInt ipvt[5]; 18204e208921SJed Brown PetscCount flops = 0; 18210da83c2eSBarry Smith PetscScalar work[25], *v_work; 18220da83c2eSBarry Smith 18230da83c2eSBarry Smith PetscFunctionBegin; 18240da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 18250da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 182608401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1827ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18289566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 182948a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18300da83c2eSBarry Smith ncnt = 0; 18310da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18320da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18339566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18340da83c2eSBarry Smith switch (bsizes[i]) { 1835d71ae5a4SJacob Faibussowitsch case 1: 1836d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1837d71ae5a4SJacob Faibussowitsch break; 18380da83c2eSBarry Smith case 2: 18399566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18400da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18420da83c2eSBarry Smith break; 18430da83c2eSBarry Smith case 3: 18449566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18450da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18470da83c2eSBarry Smith break; 18480da83c2eSBarry Smith case 4: 18499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18500da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18520da83c2eSBarry Smith break; 18530da83c2eSBarry Smith case 5: 18549566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18550da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18569566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18570da83c2eSBarry Smith break; 18580da83c2eSBarry Smith case 6: 18599566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18600da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18619566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18620da83c2eSBarry Smith break; 18630da83c2eSBarry Smith case 7: 18649566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18650da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18669566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18670da83c2eSBarry Smith break; 18680da83c2eSBarry Smith default: 18699566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18700da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18719566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18720da83c2eSBarry Smith } 18730da83c2eSBarry Smith ncnt += bsizes[i]; 18740da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 1875baa50dc0SBrad Aagaard flops += 2 * PetscPowInt64(bsizes[i], 3) / 3; 18760da83c2eSBarry Smith } 18773ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 187848a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18799566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18810da83c2eSBarry Smith } 18820da83c2eSBarry Smith 1883422a814eSBarry Smith /* 1884422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1885422a814eSBarry Smith */ 1886ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1887d71ae5a4SJacob Faibussowitsch { 188871f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1889d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18902e5835c6SStefano Zampini const MatScalar *v; 189154f21887SBarry Smith PetscScalar *idiag, *mdiag; 189271f1c65dSBarry Smith 189371f1c65dSBarry Smith PetscFunctionBegin; 18943ba16761SJacob Faibussowitsch if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS); 18959566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 189671f1c65dSBarry Smith diag = a->diag; 18974dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18982e5835c6SStefano Zampini 189971f1c65dSBarry Smith mdiag = a->mdiag; 190071f1c65dSBarry Smith idiag = a->idiag; 19019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1902422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 190371f1c65dSBarry Smith for (i = 0; i < m; i++) { 190471f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1905899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1906899639b0SHong Zhang if (PetscRealPart(fshift)) { 19079566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 19087b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19097b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19107b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 191198921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1912899639b0SHong Zhang } 191371f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 191471f1c65dSBarry Smith } 19159566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 191671f1c65dSBarry Smith } else { 191771f1c65dSBarry Smith for (i = 0; i < m; i++) { 191871f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 191971f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 192071f1c65dSBarry Smith } 19219566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 192271f1c65dSBarry Smith } 192371f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 19253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 192671f1c65dSBarry Smith } 192771f1c65dSBarry Smith 1928d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1929d71ae5a4SJacob Faibussowitsch { 1930416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1931e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19322e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 193354f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19343d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 193597f1f81fSBarry Smith const PetscInt *idx, *diag; 193617ab2063SBarry Smith 19373a40ed3dSBarry Smith PetscFunctionBegin; 1938b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19399566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 19403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1941b215bc84SStefano Zampini } 1942b965ef7fSBarry Smith its = its * lits; 194391723122SBarry Smith 194471f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19459566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 194671f1c65dSBarry Smith a->fshift = fshift; 194771f1c65dSBarry Smith a->omega = omega; 1948ed480e8bSBarry Smith 194971f1c65dSBarry Smith diag = a->diag; 195071f1c65dSBarry Smith t = a->ssor_work; 1951ed480e8bSBarry Smith idiag = a->idiag; 195271f1c65dSBarry Smith mdiag = a->mdiag; 1953ed480e8bSBarry Smith 19549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19559566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19569566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1957ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 195817ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 195917ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1960ed480e8bSBarry Smith bs = b; 196117ab2063SBarry Smith for (i = 0; i < m; i++) { 196271f1c65dSBarry Smith d = fshift + mdiag[i]; 1963416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1964ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19652e5835c6SStefano Zampini v = aa + diag[i] + 1; 196617ab2063SBarry Smith sum = b[i] * d / omega; 1967003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 196817ab2063SBarry Smith x[i] = sum; 196917ab2063SBarry Smith } 19709566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19719566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19739566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 197517ab2063SBarry Smith } 1976c783ea89SBarry Smith 197708401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1978f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19794c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1980887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 198117ab2063SBarry Smith 198217ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 198317ab2063SBarry Smith 1984887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 198517ab2063SBarry Smith */ 198617ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 198717ab2063SBarry Smith 198817ab2063SBarry Smith /* x = (E + U)^{-1} b */ 198917ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1990416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1991ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19922e5835c6SStefano Zampini v = aa + diag[i] + 1; 199317ab2063SBarry Smith sum = b[i]; 1994e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1995ed480e8bSBarry Smith x[i] = sum * idiag[i]; 199617ab2063SBarry Smith } 199717ab2063SBarry Smith 199817ab2063SBarry Smith /* t = b - (2*E - D)x */ 19992e5835c6SStefano Zampini v = aa; 20002205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 200117ab2063SBarry Smith 200217ab2063SBarry Smith /* t = (E + L)^{-1}t */ 2003ed480e8bSBarry Smith ts = t; 2004416022c9SBarry Smith diag = a->diag; 200517ab2063SBarry Smith for (i = 0; i < m; i++) { 2006416022c9SBarry Smith n = diag[i] - a->i[i]; 2007ed480e8bSBarry Smith idx = a->j + a->i[i]; 20082e5835c6SStefano Zampini v = aa + a->i[i]; 200917ab2063SBarry Smith sum = t[i]; 2010003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 2011ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2012733d66baSBarry Smith /* x = x + t */ 2013733d66baSBarry Smith x[i] += t[i]; 201417ab2063SBarry Smith } 201517ab2063SBarry Smith 20169566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20179566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20189566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 202017ab2063SBarry Smith } 202117ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 202217ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 202317ab2063SBarry Smith for (i = 0; i < m; i++) { 2024416022c9SBarry Smith n = diag[i] - a->i[i]; 2025ed480e8bSBarry Smith idx = a->j + a->i[i]; 20262e5835c6SStefano Zampini v = aa + a->i[i]; 202717ab2063SBarry Smith sum = b[i]; 2028e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20295c99c7daSBarry Smith t[i] = sum; 2030ed480e8bSBarry Smith x[i] = sum * idiag[i]; 203117ab2063SBarry Smith } 20325c99c7daSBarry Smith xb = t; 20339566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20343a40ed3dSBarry Smith } else xb = b; 203517ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 203617ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2037416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2038ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20392e5835c6SStefano Zampini v = aa + diag[i] + 1; 204017ab2063SBarry Smith sum = xb[i]; 2041e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20425c99c7daSBarry Smith if (xb == b) { 2043ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20445c99c7daSBarry Smith } else { 2045b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 204617ab2063SBarry Smith } 20475c99c7daSBarry Smith } 20489566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 204917ab2063SBarry Smith } 205017ab2063SBarry Smith its--; 205117ab2063SBarry Smith } 205217ab2063SBarry Smith while (its--) { 205317ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 205417ab2063SBarry Smith for (i = 0; i < m; i++) { 2055b19a5dc2SMark Adams /* lower */ 2056b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2057ed480e8bSBarry Smith idx = a->j + a->i[i]; 20582e5835c6SStefano Zampini v = aa + a->i[i]; 205917ab2063SBarry Smith sum = b[i]; 2060e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2061b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2062b19a5dc2SMark Adams /* upper */ 2063b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2064b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20652e5835c6SStefano Zampini v = aa + diag[i] + 1; 2066b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2067b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 206817ab2063SBarry Smith } 2069b19a5dc2SMark Adams xb = t; 20709566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2071b19a5dc2SMark Adams } else xb = b; 207217ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 207317ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2074b19a5dc2SMark Adams sum = xb[i]; 2075b19a5dc2SMark Adams if (xb == b) { 2076b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2077416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2078ed480e8bSBarry Smith idx = a->j + a->i[i]; 20792e5835c6SStefano Zampini v = aa + a->i[i]; 2080e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2081ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2082b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2083b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2084b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20852e5835c6SStefano Zampini v = aa + diag[i] + 1; 2086b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2087b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 208817ab2063SBarry Smith } 2089b19a5dc2SMark Adams } 2090b19a5dc2SMark Adams if (xb == b) { 20919566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2092b19a5dc2SMark Adams } else { 20939566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2094b19a5dc2SMark Adams } 209517ab2063SBarry Smith } 209617ab2063SBarry Smith } 20979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20989566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20999566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 21003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 210117ab2063SBarry Smith } 210217ab2063SBarry Smith 2103ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2104d71ae5a4SJacob Faibussowitsch { 2105416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21064e220ebcSLois Curfman McInnes 21073a40ed3dSBarry Smith PetscFunctionBegin; 21084e220ebcSLois Curfman McInnes info->block_size = 1.0; 21093966268fSBarry Smith info->nz_allocated = a->maxnz; 21103966268fSBarry Smith info->nz_used = a->nz; 21113966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21123966268fSBarry Smith info->assemblies = A->num_ass; 21133966268fSBarry Smith info->mallocs = A->info.mallocs; 21144dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2115d5f3da31SBarry Smith if (A->factortype) { 21164e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21174e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21184e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21194e220ebcSLois Curfman McInnes } else { 21204e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21214e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21224e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 21234e220ebcSLois Curfman McInnes } 21243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 212517ab2063SBarry Smith } 212617ab2063SBarry Smith 2127ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2128d71ae5a4SJacob Faibussowitsch { 2129416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2130c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 213197b48c8fSBarry Smith const PetscScalar *xx; 21322e5835c6SStefano Zampini PetscScalar *bb, *aa; 2133c7da8527SEric Chamberland PetscInt d = 0; 213417ab2063SBarry Smith 21353a40ed3dSBarry Smith PetscFunctionBegin; 213697b48c8fSBarry Smith if (x && b) { 21379566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21389566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 213997b48c8fSBarry Smith for (i = 0; i < N; i++) { 2140aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2141447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 214297b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 214397b48c8fSBarry Smith } 21449566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21459566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 214697b48c8fSBarry Smith } 214797b48c8fSBarry Smith 21489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2149a9817697SBarry Smith if (a->keepnonzeropattern) { 2150f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2151aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21529566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2153f1e2ffcdSBarry Smith } 2154f4df32b1SMatthew Knepley if (diag != 0.0) { 2155c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2156c7da8527SEric Chamberland d = rows[i]; 2157447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 215808401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2159c7da8527SEric Chamberland } 2160f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2161447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21622e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2163f1e2ffcdSBarry Smith } 2164f1e2ffcdSBarry Smith } 2165f1e2ffcdSBarry Smith } else { 2166f4df32b1SMatthew Knepley if (diag != 0.0) { 216717ab2063SBarry Smith for (i = 0; i < N; i++) { 2168aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21697ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2170447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2171447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2172447d62f5SStefano Zampini } else { 2173416022c9SBarry Smith a->ilen[rows[i]] = 1; 21742e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2175bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2176447d62f5SStefano Zampini } 2177447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21789566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 217917ab2063SBarry Smith } 218017ab2063SBarry Smith } 21813a40ed3dSBarry Smith } else { 218217ab2063SBarry Smith for (i = 0; i < N; i++) { 2183aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2184416022c9SBarry Smith a->ilen[rows[i]] = 0; 218517ab2063SBarry Smith } 218617ab2063SBarry Smith } 2187e56f5c9eSBarry Smith A->nonzerostate++; 2188f1e2ffcdSBarry Smith } 21899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2190dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 219217ab2063SBarry Smith } 219317ab2063SBarry Smith 2194ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2195d71ae5a4SJacob Faibussowitsch { 21966e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21976e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21982b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21996e169961SBarry Smith const PetscScalar *xx; 22002e5835c6SStefano Zampini PetscScalar *bb, *aa; 22016e169961SBarry Smith 22026e169961SBarry Smith PetscFunctionBegin; 22033ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 22049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 22056e169961SBarry Smith if (x && b) { 22069566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 22079566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 22082b40b63fSBarry Smith vecs = PETSC_TRUE; 22096e169961SBarry Smith } 22109566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 22116e169961SBarry Smith for (i = 0; i < N; i++) { 2212aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 22138e3a54c0SPierre Jolivet PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]])); 22142205254eSKarl Rupp 22156e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22166e169961SBarry Smith } 22176e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22186e169961SBarry Smith if (!zeroed[i]) { 22196e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22204cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22212e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22222e5835c6SStefano Zampini aa[j] = 0.0; 22236e169961SBarry Smith } 22246e169961SBarry Smith } 22254cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i]; 22266e169961SBarry Smith } 22276e169961SBarry Smith if (x && b) { 22289566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22299566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22306e169961SBarry Smith } 22319566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22326e169961SBarry Smith if (diag != 0.0) { 22339566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22341d5a398dSstefano_zampini if (missing) { 22351d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22364cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2237aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22389566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22391d5a398dSstefano_zampini } 22401d5a398dSstefano_zampini } else { 2241ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22426e169961SBarry Smith } 22431d5a398dSstefano_zampini } 22449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2245dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22476e169961SBarry Smith } 22486e169961SBarry Smith 2249d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2250d71ae5a4SJacob Faibussowitsch { 2251fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2252fff043a9SJunchao Zhang const PetscScalar *aa; 225317ab2063SBarry Smith 22543a40ed3dSBarry Smith PetscFunctionBegin; 22559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2256416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22578e3a54c0SPierre Jolivet if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]); 225817ab2063SBarry Smith if (idx) { 22595c0db29aSPierre Jolivet if (*nz && a->j) *idx = a->j + a->i[row]; 2260f4259b30SLisandro Dalcin else *idx = NULL; 226117ab2063SBarry Smith } 22629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 226417ab2063SBarry Smith } 226517ab2063SBarry Smith 2266d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2267d71ae5a4SJacob Faibussowitsch { 22683a40ed3dSBarry Smith PetscFunctionBegin; 22693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 227017ab2063SBarry Smith } 227117ab2063SBarry Smith 2272ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2273d71ae5a4SJacob Faibussowitsch { 2274416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22752e5835c6SStefano Zampini const MatScalar *v; 227636db0b34SBarry Smith PetscReal sum = 0.0; 227797f1f81fSBarry Smith PetscInt i, j; 227817ab2063SBarry Smith 22793a40ed3dSBarry Smith PetscFunctionBegin; 22809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 228117ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2282570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2283570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2284792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2285570b7f6dSBarry Smith #else 2286416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22879371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22889371c9d4SSatish Balay v++; 228917ab2063SBarry Smith } 22908f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2291570b7f6dSBarry Smith #endif 22929566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 22933a40ed3dSBarry Smith } else if (type == NORM_1) { 229436db0b34SBarry Smith PetscReal *tmp; 229597f1f81fSBarry Smith PetscInt *jj = a->j; 22969566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2297064f8208SBarry Smith *nrm = 0.0; 2298416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22999371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 23009371c9d4SSatish Balay v++; 230117ab2063SBarry Smith } 2302d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2303064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 230417ab2063SBarry Smith } 23059566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23069566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 23073a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2308064f8208SBarry Smith *nrm = 0.0; 2309d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 23108e3a54c0SPierre Jolivet const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]); 231117ab2063SBarry Smith sum = 0.0; 2312416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23139371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23149371c9d4SSatish Balay v2++; 231517ab2063SBarry Smith } 2316064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 231717ab2063SBarry Smith } 23189566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2319f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 232217ab2063SBarry Smith } 232317ab2063SBarry Smith 2324ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2325d71ae5a4SJacob Faibussowitsch { 23263d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 232754f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 23282e5835c6SStefano Zampini const MatScalar *va, *vb; 232997f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2330cd0d46ebSvictorle 2331cd0d46ebSvictorle PetscFunctionBegin; 23329566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23339566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23345485867bSBarry Smith if (ma != nb || na != mb) { 23355485867bSBarry Smith *f = PETSC_FALSE; 23363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23375485867bSBarry Smith } 23389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23409371c9d4SSatish Balay aii = aij->i; 23419371c9d4SSatish Balay bii = bij->i; 23429371c9d4SSatish Balay adx = aij->j; 23439371c9d4SSatish Balay bdx = bij->j; 23449566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23459566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2346cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2347cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2348cd0d46ebSvictorle 2349cd0d46ebSvictorle *f = PETSC_TRUE; 2350cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2351cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 235297f1f81fSBarry Smith PetscInt idc, idr; 23535485867bSBarry Smith PetscScalar vc, vr; 2354cd0d46ebSvictorle /* column/row index/value */ 23555485867bSBarry Smith idc = adx[aptr[i]]; 23565485867bSBarry Smith idr = bdx[bptr[idc]]; 23575485867bSBarry Smith vc = va[aptr[i]]; 23585485867bSBarry Smith vr = vb[bptr[idc]]; 23595485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23605485867bSBarry Smith *f = PETSC_FALSE; 23615485867bSBarry Smith goto done; 2362cd0d46ebSvictorle } else { 23635485867bSBarry Smith aptr[i]++; 23645485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2365cd0d46ebSvictorle } 2366cd0d46ebSvictorle } 2367cd0d46ebSvictorle } 2368cd0d46ebSvictorle done: 23699566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 23709566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 23733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2374cd0d46ebSvictorle } 2375cd0d46ebSvictorle 2376ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2377d71ae5a4SJacob Faibussowitsch { 23783d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 237954f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 238054f21887SBarry Smith MatScalar *va, *vb; 23811cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23821cbb95d3SBarry Smith 23831cbb95d3SBarry Smith PetscFunctionBegin; 23849566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23859566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23861cbb95d3SBarry Smith if (ma != nb || na != mb) { 23871cbb95d3SBarry Smith *f = PETSC_FALSE; 23883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23891cbb95d3SBarry Smith } 23909371c9d4SSatish Balay aii = aij->i; 23919371c9d4SSatish Balay bii = bij->i; 23929371c9d4SSatish Balay adx = aij->j; 23939371c9d4SSatish Balay bdx = bij->j; 23949371c9d4SSatish Balay va = aij->a; 23959371c9d4SSatish Balay vb = bij->a; 23969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23981cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23991cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 24001cbb95d3SBarry Smith 24011cbb95d3SBarry Smith *f = PETSC_TRUE; 24021cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 24031cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 24041cbb95d3SBarry Smith PetscInt idc, idr; 24051cbb95d3SBarry Smith PetscScalar vc, vr; 24061cbb95d3SBarry Smith /* column/row index/value */ 24071cbb95d3SBarry Smith idc = adx[aptr[i]]; 24081cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24091cbb95d3SBarry Smith vc = va[aptr[i]]; 24101cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24111cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24121cbb95d3SBarry Smith *f = PETSC_FALSE; 24131cbb95d3SBarry Smith goto done; 24141cbb95d3SBarry Smith } else { 24151cbb95d3SBarry Smith aptr[i]++; 24161cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24171cbb95d3SBarry Smith } 24181cbb95d3SBarry Smith } 24191cbb95d3SBarry Smith } 24201cbb95d3SBarry Smith done: 24219566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24229566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24241cbb95d3SBarry Smith } 24251cbb95d3SBarry Smith 2426d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2427d71ae5a4SJacob Faibussowitsch { 2428416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2429fff8e43fSBarry Smith const PetscScalar *l, *r; 2430fff8e43fSBarry Smith PetscScalar x; 243154f21887SBarry Smith MatScalar *v; 2432fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2433fff8e43fSBarry Smith const PetscInt *jj; 243417ab2063SBarry Smith 24353a40ed3dSBarry Smith PetscFunctionBegin; 243617ab2063SBarry Smith if (ll) { 24373ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24383ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24399566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 244008401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24419566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 244317ab2063SBarry Smith for (i = 0; i < m; i++) { 244417ab2063SBarry Smith x = l[i]; 2445416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24462205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 244717ab2063SBarry Smith } 24489566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24499566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 245117ab2063SBarry Smith } 245217ab2063SBarry Smith if (rr) { 24539566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 245408401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24559566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24572e5835c6SStefano Zampini jj = a->j; 24582205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24609566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24619566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 246217ab2063SBarry Smith } 24639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 246517ab2063SBarry Smith } 246617ab2063SBarry Smith 2467d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2468d71ae5a4SJacob Faibussowitsch { 2469db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2470d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 247197f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24725d0c19d7SBarry Smith const PetscInt *irow, *icol; 24732e5835c6SStefano Zampini const PetscScalar *aa; 24745d0c19d7SBarry Smith PetscInt nrows, ncols; 247597f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 2476fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2477416022c9SBarry Smith Mat C; 2478cdc6f3adSToby Isaac PetscBool stride; 247917ab2063SBarry Smith 24803a40ed3dSBarry Smith PetscFunctionBegin; 24819566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24829566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24839566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 248417ab2063SBarry Smith 24859566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2486ff718158SBarry Smith if (stride) { 24879566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2488ff718158SBarry Smith } else { 2489ff718158SBarry Smith first = 0; 2490ff718158SBarry Smith step = 0; 2491ff718158SBarry Smith } 2492fee21e36SBarry Smith if (stride && step == 1) { 249302834360SBarry Smith /* special case of contiguous rows */ 24949566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 249502834360SBarry Smith /* loop over new rows determining lens and starting points */ 249602834360SBarry Smith for (i = 0; i < nrows; i++) { 2497bfeeae90SHong Zhang kstart = ai[irow[i]]; 2498a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2499a91a9bebSLisandro Dalcin starts[i] = kstart; 250002834360SBarry Smith for (k = kstart; k < kend; k++) { 2501bfeeae90SHong Zhang if (aj[k] >= first) { 250202834360SBarry Smith starts[i] = k; 250302834360SBarry Smith break; 250402834360SBarry Smith } 250502834360SBarry Smith } 2506a2744918SBarry Smith sum = 0; 250702834360SBarry Smith while (k < kend) { 2508bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2509a2744918SBarry Smith sum++; 251002834360SBarry Smith } 2511a2744918SBarry Smith lens[i] = sum; 251202834360SBarry Smith } 251302834360SBarry Smith /* create submatrix */ 2514cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 251597f1f81fSBarry Smith PetscInt n_cols, n_rows; 25169566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2517aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25189566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 251908480c60SBarry Smith C = *B; 25203a40ed3dSBarry Smith } else { 25213bef6203SJed Brown PetscInt rbs, cbs; 25229566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25239566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25249566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25259566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25269566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25279566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 252908480c60SBarry Smith } 2530db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2531db02288aSLois Curfman McInnes 253202834360SBarry Smith /* loop over rows inserting into submatrix */ 2533fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2534db02288aSLois Curfman McInnes j_new = c->j; 2535db02288aSLois Curfman McInnes i_new = c->i; 25369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 253702834360SBarry Smith for (i = 0; i < nrows; i++) { 2538a2744918SBarry Smith ii = starts[i]; 2539a2744918SBarry Smith lensi = lens[i]; 2540810441c8SPierre Jolivet if (lensi) { 2541ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25429566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2543a2744918SBarry Smith a_new += lensi; 2544810441c8SPierre Jolivet } 2545a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2546a2744918SBarry Smith c->ilen[i] = lensi; 254702834360SBarry Smith } 2548fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25509566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25513a40ed3dSBarry Smith } else { 25529566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25539566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25549566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25554dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25566bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25574dcab191SBarry Smith smap[icol[i]] = i + 1; 25584dcab191SBarry Smith } 25594dcab191SBarry Smith 256002834360SBarry Smith /* determine lens of each row */ 256102834360SBarry Smith for (i = 0; i < nrows; i++) { 2562bfeeae90SHong Zhang kstart = ai[irow[i]]; 256302834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 256402834360SBarry Smith lens[i] = 0; 256502834360SBarry Smith for (k = kstart; k < kend; k++) { 2566ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 256702834360SBarry Smith } 256802834360SBarry Smith } 256917ab2063SBarry Smith /* Create and fill new matrix */ 2570a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2571ace3abfcSBarry Smith PetscBool equal; 25720f5bd95cSBarry Smith 257399141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2574aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25759566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 2576fdfbdca6SPierre Jolivet PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong number of nonzeros"); 25779566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 257808480c60SBarry Smith C = *B; 25793a40ed3dSBarry Smith } else { 25803bef6203SJed Brown PetscInt rbs, cbs; 25819566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25829566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25839566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25849566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 258537a5e0faSPierre Jolivet if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25869566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 258808480c60SBarry Smith } 25899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2590fb3c7e2dSJunchao Zhang 2591f4f49eeaSPierre Jolivet c = (Mat_SeqAIJ *)C->data; 2592fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 259317ab2063SBarry Smith for (i = 0; i < nrows; i++) { 259499141d43SSatish Balay row = irow[i]; 2595bfeeae90SHong Zhang kstart = ai[row]; 259699141d43SSatish Balay kend = kstart + a->ilen[row]; 2597bfeeae90SHong Zhang mat_i = c->i[i]; 25988e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 25998e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 260099141d43SSatish Balay mat_ilen = c->ilen + i; 260117ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2602bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2603ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26042e5835c6SStefano Zampini *mat_a++ = aa[k]; 260599141d43SSatish Balay (*mat_ilen)++; 260617ab2063SBarry Smith } 260717ab2063SBarry Smith } 260817ab2063SBarry Smith } 26099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 261002834360SBarry Smith /* Free work space */ 26119566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26129566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26139566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2614cdc6f3adSToby Isaac /* sort */ 2615cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2616cdc6f3adSToby Isaac PetscInt ilen; 2617cdc6f3adSToby Isaac 2618cdc6f3adSToby Isaac mat_i = c->i[i]; 26198e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 26208e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 2621cdc6f3adSToby Isaac ilen = c->ilen[i]; 26229566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2623cdc6f3adSToby Isaac } 2624fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 262502834360SBarry Smith } 26268c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26279566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2628305c6ccfSStefano Zampini #endif 26299566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26309566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 263117ab2063SBarry Smith 26329566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2633416022c9SBarry Smith *B = C; 26343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 263517ab2063SBarry Smith } 263617ab2063SBarry Smith 2637ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2638d71ae5a4SJacob Faibussowitsch { 263982d44351SHong Zhang Mat B; 264082d44351SHong Zhang 264182d44351SHong Zhang PetscFunctionBegin; 2642c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26439566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26449566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26459566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26469566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26479566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 264882d44351SHong Zhang *subMat = B; 2649c2d650bdSHong Zhang } else { 26509566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2651c2d650bdSHong Zhang } 26523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 265382d44351SHong Zhang } 265482d44351SHong Zhang 2655ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2656d71ae5a4SJacob Faibussowitsch { 265763b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 265863b91edcSBarry Smith Mat outA; 2659ace3abfcSBarry Smith PetscBool row_identity, col_identity; 266063b91edcSBarry Smith 26613a40ed3dSBarry Smith PetscFunctionBegin; 266208401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26631df811f5SHong Zhang 26649566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26659566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2666a871dcd8SBarry Smith 266763b91edcSBarry Smith outA = inA; 2668d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26699566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26709566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26712205254eSKarl Rupp 26729566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26739566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26742205254eSKarl Rupp 2675c3122656SLisandro Dalcin a->row = row; 26762205254eSKarl Rupp 26779566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26789566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26792205254eSKarl Rupp 2680c3122656SLisandro Dalcin a->col = col; 268163b91edcSBarry Smith 268236db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26839566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26849566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2685f0ec6fceSSatish Balay 268694a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26879566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 268894a9d846SBarry Smith } 268963b91edcSBarry Smith 26909566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2691137fb511SHong Zhang if (row_identity && col_identity) { 26929566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2693137fb511SHong Zhang } else { 26949566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2695137fb511SHong Zhang } 26963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2697a871dcd8SBarry Smith } 2698a871dcd8SBarry Smith 2699d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2700d71ae5a4SJacob Faibussowitsch { 2701f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2702dfa0f9e5SStefano Zampini PetscScalar *v; 2703c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 27043a40ed3dSBarry Smith 27053a40ed3dSBarry Smith PetscFunctionBegin; 27069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27079566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2708792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27099566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2713f0b747eeSBarry Smith } 2714f0b747eeSBarry Smith 2715d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2716d71ae5a4SJacob Faibussowitsch { 271716b64355SHong Zhang PetscInt i; 271816b64355SHong Zhang 271916b64355SHong Zhang PetscFunctionBegin; 272016b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27219566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 272216b64355SHong Zhang 272348a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27249566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 272516b64355SHong Zhang 272616b64355SHong Zhang if (submatj->rbuf1) { 27279566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27289566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 272916b64355SHong Zhang } 273016b64355SHong Zhang 273148a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27329566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27339566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 273416b64355SHong Zhang } 273516b64355SHong Zhang 273616b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2737eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27389566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27399566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 274016b64355SHong Zhang #else 27419566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 274216b64355SHong Zhang #endif 274316b64355SHong Zhang 274416b64355SHong Zhang if (!submatj->allcolumns) { 274516b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2746eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap)); 274716b64355SHong Zhang #else 27489566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 274916b64355SHong Zhang #endif 275016b64355SHong Zhang } 27519566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 275216b64355SHong Zhang 27539566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 27543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 275516b64355SHong Zhang } 275616b64355SHong Zhang 2757d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2758d71ae5a4SJacob Faibussowitsch { 275916b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27605c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 276116b64355SHong Zhang 276216b64355SHong Zhang PetscFunctionBegin; 27639566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27649566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 276616b64355SHong Zhang } 276716b64355SHong Zhang 276889a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2769ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2770d71ae5a4SJacob Faibussowitsch { 27712d033e1fSHong Zhang PetscInt i; 27720fb991dcSHong Zhang Mat C; 27730fb991dcSHong Zhang Mat_SeqAIJ *c; 27740fb991dcSHong Zhang Mat_SubSppt *submatj; 27752d033e1fSHong Zhang 27762d033e1fSHong Zhang PetscFunctionBegin; 27772d033e1fSHong Zhang for (i = 0; i < n; i++) { 27780fb991dcSHong Zhang C = (*mat)[i]; 27790fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27800fb991dcSHong Zhang submatj = c->submatis1; 27812d033e1fSHong Zhang if (submatj) { 2782682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 278326cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27849566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27859566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27869566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27873faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27889566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27899566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27909566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2791682e4c99SStefano Zampini } 27922d033e1fSHong Zhang } else { 27939566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27942d033e1fSHong Zhang } 27952d033e1fSHong Zhang } 279686e85357SHong Zhang 279763a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27989566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 279963a75b2aSHong Zhang 28009566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28022d033e1fSHong Zhang } 28032d033e1fSHong Zhang 2804ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2805d71ae5a4SJacob Faibussowitsch { 280697f1f81fSBarry Smith PetscInt i; 2807cddf8d76SBarry Smith 28083a40ed3dSBarry Smith PetscFunctionBegin; 280948a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2810cddf8d76SBarry Smith 281148a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2813cddf8d76SBarry Smith } 2814cddf8d76SBarry Smith 2815ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2816d71ae5a4SJacob Faibussowitsch { 2817e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28189a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, isz, val; 28195d0c19d7SBarry Smith const PetscInt *idx; 28209a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1; 2821f1af5d2fSBarry Smith PetscBT table; 2822bbd702dbSSatish Balay 28233a40ed3dSBarry Smith PetscFunctionBegin; 28249a88ca10SBarry Smith m = A->rmap->n / bs; 2825e4d965acSSatish Balay ai = a->i; 2826bfeeae90SHong Zhang aj = a->j; 28278a047759SSatish Balay 282808401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 282906763907SSatish Balay 28309566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28319566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 283206763907SSatish Balay 2833e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2834b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2835e4d965acSSatish Balay isz = 0; 28369566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2837e4d965acSSatish Balay 2838e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28399566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28409566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2841e4d965acSSatish Balay 28429a88ca10SBarry Smith if (bs > 1) { 28439a88ca10SBarry Smith /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 28449a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28459a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28469a88ca10SBarry Smith } 28479a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28489a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28499a88ca10SBarry Smith 28509a88ca10SBarry Smith k = 0; 28519a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28529a88ca10SBarry Smith n = isz; 28539a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28549a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28559a88ca10SBarry Smith row = bs * nidx[k] + ll; 28569a88ca10SBarry Smith start = ai[row]; 28579a88ca10SBarry Smith end = ai[row + 1]; 28589a88ca10SBarry Smith for (l = start; l < end; l++) { 28599a88ca10SBarry Smith val = aj[l] / bs; 28609a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28619a88ca10SBarry Smith } 28629a88ca10SBarry Smith } 28639a88ca10SBarry Smith } 28649a88ca10SBarry Smith } 28659a88ca10SBarry Smith PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i))); 28669a88ca10SBarry Smith } else { 2867dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 2868e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28692205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28704dcbc457SBarry Smith } 28719566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28729566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2873e4d965acSSatish Balay 287404a348a9SBarry Smith k = 0; 287504a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 287604a348a9SBarry Smith n = isz; 287706763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2878e4d965acSSatish Balay row = nidx[k]; 2879e4d965acSSatish Balay start = ai[row]; 2880e4d965acSSatish Balay end = ai[row + 1]; 288104a348a9SBarry Smith for (l = start; l < end; l++) { 2882efb16452SHong Zhang val = aj[l]; 28832205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2884e4d965acSSatish Balay } 2885e4d965acSSatish Balay } 2886e4d965acSSatish Balay } 28879566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2888e4d965acSSatish Balay } 28899a88ca10SBarry Smith } 28909566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28919566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28934dcbc457SBarry Smith } 289417ab2063SBarry Smith 2895ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2896d71ae5a4SJacob Faibussowitsch { 28970513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28983b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 28995d0c19d7SBarry Smith const PetscInt *row, *col; 29005d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 290156cd22aeSBarry Smith IS icolp, irowp; 29020298fd71SBarry Smith PetscInt *cwork = NULL; 29030298fd71SBarry Smith PetscScalar *vwork = NULL; 29040513a670SBarry Smith 29053a40ed3dSBarry Smith PetscFunctionBegin; 29069566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29079566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29089566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29099566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29100513a670SBarry Smith 29110513a670SBarry Smith /* determine lengths of permuted rows */ 29129566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29132205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29149566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29159566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29169566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29179566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29199566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29200513a670SBarry Smith 29219566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29220513a670SBarry Smith for (i = 0; i < m; i++) { 29239566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29242205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29259566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29269566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29270513a670SBarry Smith } 29289566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29292205254eSKarl Rupp 29303c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29312205254eSKarl Rupp 29328c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29339566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29349fe5e383SStefano Zampini #endif 29359566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29369566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29379566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29389566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29399566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29409566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 294148a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29430513a670SBarry Smith } 29440513a670SBarry Smith 2945d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2946d71ae5a4SJacob Faibussowitsch { 2947cb5b572fSBarry Smith PetscFunctionBegin; 294833f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 294933f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2950be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2951be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29522e5835c6SStefano Zampini const PetscScalar *aa; 2953be6bf707SBarry Smith 29549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 295508401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29569566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29579566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2959cb5b572fSBarry Smith } else { 29609566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2961cb5b572fSBarry Smith } 29623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2963cb5b572fSBarry Smith } 2964cb5b572fSBarry Smith 2965d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2966d71ae5a4SJacob Faibussowitsch { 29676c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29686e111a19SKarl Rupp 29696c0721eeSBarry Smith PetscFunctionBegin; 29706c0721eeSBarry Smith *array = a->a; 29713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29726c0721eeSBarry Smith } 29736c0721eeSBarry Smith 2974d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[]) 2975d71ae5a4SJacob Faibussowitsch { 29766c0721eeSBarry Smith PetscFunctionBegin; 2977f38c1e66SStefano Zampini *array = NULL; 29783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29796c0721eeSBarry Smith } 2980273d9f13SBarry Smith 29818229c054SShri Abhyankar /* 29828229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29838229c054SShri Abhyankar have different nonzero structure. 29848229c054SShri Abhyankar */ 2985d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2986d71ae5a4SJacob Faibussowitsch { 2987b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2988ec7775f6SShri Abhyankar 2989ec7775f6SShri Abhyankar PetscFunctionBegin; 2990ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2991ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 29928e3a54c0SPierre Jolivet const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]); 2993b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 2994b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 29958af7cee1SJed Brown nnz[i] = 0; 29968af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 2997b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2998b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 29998af7cee1SJed Brown nnz[i]++; 30008af7cee1SJed Brown } 30018af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 3002ec7775f6SShri Abhyankar } 30033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3004ec7775f6SShri Abhyankar } 3005ec7775f6SShri Abhyankar 3006d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3007d71ae5a4SJacob Faibussowitsch { 3008b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3009b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3010b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data; 3011b264fe52SHong Zhang 3012b264fe52SHong Zhang PetscFunctionBegin; 3013b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30149566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 30153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3016b264fe52SHong Zhang } 3017b264fe52SHong Zhang 3018d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3019d71ae5a4SJacob Faibussowitsch { 3020ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3021ac90fabeSBarry Smith 3022ac90fabeSBarry Smith PetscFunctionBegin; 3023134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3024134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3025134adf20SPierre Jolivet if (e) { 30269566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 302781fa06acSBarry Smith if (e) { 30289566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3029134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 303081fa06acSBarry Smith } 303181fa06acSBarry Smith } 303254c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 303381fa06acSBarry Smith } 3034ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30352e5835c6SStefano Zampini const PetscScalar *xa; 30362e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 303781fa06acSBarry Smith PetscBLASInt one = 1, bnz; 303881fa06acSBarry Smith 30399566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3042792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 30439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30459566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30479566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3048ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30499566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3050ac90fabeSBarry Smith } else { 30518229c054SShri Abhyankar Mat B; 30528229c054SShri Abhyankar PetscInt *nnz; 30539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30549566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30559566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30569566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30579566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30589566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30609566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30619566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30629bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30639566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3064ac90fabeSBarry Smith } 30653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3066ac90fabeSBarry Smith } 3067ac90fabeSBarry Smith 3068d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3069d71ae5a4SJacob Faibussowitsch { 3070354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3071354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3072354c94deSBarry Smith PetscInt i, nz; 3073354c94deSBarry Smith PetscScalar *a; 3074354c94deSBarry Smith 3075354c94deSBarry Smith PetscFunctionBegin; 3076354c94deSBarry Smith nz = aij->nz; 30779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30782205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 30799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3080354c94deSBarry Smith #else 3081354c94deSBarry Smith PetscFunctionBegin; 3082354c94deSBarry Smith #endif 30833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3084354c94deSBarry Smith } 3085354c94deSBarry Smith 3086ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3087d71ae5a4SJacob Faibussowitsch { 3088e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3089d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3090e34fafa9SBarry Smith PetscReal atmp; 3091985db425SBarry Smith PetscScalar *x; 3092ce496241SStefano Zampini const MatScalar *aa, *av; 3093e34fafa9SBarry Smith 3094e34fafa9SBarry Smith PetscFunctionBegin; 309528b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 30969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3097ce496241SStefano Zampini aa = av; 3098e34fafa9SBarry Smith ai = a->i; 3099e34fafa9SBarry Smith aj = a->j; 3100e34fafa9SBarry Smith 31019566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31029566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31039566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 310408401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3105e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31069371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31079371c9d4SSatish Balay ai++; 3108e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3109985db425SBarry Smith atmp = PetscAbsScalar(*aa); 31109371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31119371c9d4SSatish Balay x[i] = atmp; 31129371c9d4SSatish Balay if (idx) idx[i] = *aj; 31139371c9d4SSatish Balay } 31149371c9d4SSatish Balay aa++; 31159371c9d4SSatish Balay aj++; 3116985db425SBarry Smith } 3117985db425SBarry Smith } 31189566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3121985db425SBarry Smith } 3122985db425SBarry Smith 3123eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v) 3124eede4a3fSMark Adams { 3125eede4a3fSMark Adams Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3126eede4a3fSMark Adams PetscInt i, j, m = A->rmap->n, *ai, ncols, n; 3127eede4a3fSMark Adams PetscScalar *x; 3128eede4a3fSMark Adams const MatScalar *aa, *av; 3129eede4a3fSMark Adams 3130eede4a3fSMark Adams PetscFunctionBegin; 3131eede4a3fSMark Adams PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3132eede4a3fSMark Adams PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3133eede4a3fSMark Adams aa = av; 3134eede4a3fSMark Adams ai = a->i; 3135eede4a3fSMark Adams 3136eede4a3fSMark Adams PetscCall(VecSet(v, 0.0)); 3137eede4a3fSMark Adams PetscCall(VecGetArrayWrite(v, &x)); 3138eede4a3fSMark Adams PetscCall(VecGetLocalSize(v, &n)); 3139eede4a3fSMark Adams PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3140eede4a3fSMark Adams for (i = 0; i < m; i++) { 3141eede4a3fSMark Adams ncols = ai[1] - ai[0]; 3142eede4a3fSMark Adams ai++; 3143eede4a3fSMark Adams for (j = 0; j < ncols; j++) { 3144eede4a3fSMark Adams x[i] += PetscAbsScalar(*aa); 3145eede4a3fSMark Adams aa++; 3146eede4a3fSMark Adams } 3147eede4a3fSMark Adams } 3148eede4a3fSMark Adams PetscCall(VecRestoreArrayWrite(v, &x)); 3149eede4a3fSMark Adams PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3150eede4a3fSMark Adams PetscFunctionReturn(PETSC_SUCCESS); 3151eede4a3fSMark Adams } 3152eede4a3fSMark Adams 3153ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3154d71ae5a4SJacob Faibussowitsch { 3155985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3156d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3157985db425SBarry Smith PetscScalar *x; 3158ce496241SStefano Zampini const MatScalar *aa, *av; 3159985db425SBarry Smith 3160985db425SBarry Smith PetscFunctionBegin; 316128b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3163ce496241SStefano Zampini aa = av; 3164985db425SBarry Smith ai = a->i; 3165985db425SBarry Smith aj = a->j; 3166985db425SBarry Smith 31679566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31689566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31699566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 317008401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3171985db425SBarry Smith for (i = 0; i < m; i++) { 31729371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31739371c9d4SSatish Balay ai++; 3174d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31759371c9d4SSatish Balay x[i] = *aa; 31769371c9d4SSatish Balay if (idx) idx[i] = 0; 3177985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3178985db425SBarry Smith x[i] = 0.0; 3179985db425SBarry Smith if (idx) { 3180985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3181985db425SBarry Smith if (aj[j] > j) { 3182985db425SBarry Smith idx[i] = j; 3183985db425SBarry Smith break; 3184985db425SBarry Smith } 3185985db425SBarry Smith } 31861a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31871a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3188985db425SBarry Smith } 3189985db425SBarry Smith } 3190985db425SBarry Smith for (j = 0; j < ncols; j++) { 31919371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31929371c9d4SSatish Balay x[i] = *aa; 31939371c9d4SSatish Balay if (idx) idx[i] = *aj; 31949371c9d4SSatish Balay } 31959371c9d4SSatish Balay aa++; 31969371c9d4SSatish Balay aj++; 3197985db425SBarry Smith } 3198985db425SBarry Smith } 31999566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3202985db425SBarry Smith } 3203985db425SBarry Smith 3204ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3205d71ae5a4SJacob Faibussowitsch { 3206c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3207c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3208ce496241SStefano Zampini PetscScalar *x; 3209ce496241SStefano Zampini const MatScalar *aa, *av; 3210c87e5d42SMatthew Knepley 3211c87e5d42SMatthew Knepley PetscFunctionBegin; 32129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3213ce496241SStefano Zampini aa = av; 3214c87e5d42SMatthew Knepley ai = a->i; 3215c87e5d42SMatthew Knepley aj = a->j; 3216c87e5d42SMatthew Knepley 32179566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32189566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32199566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 322008401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3221c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32229371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32239371c9d4SSatish Balay ai++; 3224f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32259371c9d4SSatish Balay x[i] = *aa; 32269371c9d4SSatish Balay if (idx) idx[i] = 0; 3227f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3228f07e67edSHong Zhang x[i] = 0.0; 3229f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3230289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3231f07e67edSHong Zhang if (aj[j] > j) { 3232f07e67edSHong Zhang idx[i] = j; 32332205254eSKarl Rupp break; 32342205254eSKarl Rupp } 3235289a08f5SMatthew Knepley } 3236f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3237f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3238f07e67edSHong Zhang } 3239289a08f5SMatthew Knepley } 3240c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32419371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32429371c9d4SSatish Balay x[i] = *aa; 32439371c9d4SSatish Balay if (idx) idx[i] = *aj; 32449371c9d4SSatish Balay } 32459371c9d4SSatish Balay aa++; 32469371c9d4SSatish Balay aj++; 3247c87e5d42SMatthew Knepley } 3248c87e5d42SMatthew Knepley } 32499566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3252c87e5d42SMatthew Knepley } 3253c87e5d42SMatthew Knepley 3254ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3255d71ae5a4SJacob Faibussowitsch { 3256985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3257d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3258d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3259985db425SBarry Smith PetscScalar *x; 3260ce496241SStefano Zampini const MatScalar *aa, *av; 3261985db425SBarry Smith 3262985db425SBarry Smith PetscFunctionBegin; 326328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3265ce496241SStefano Zampini aa = av; 3266985db425SBarry Smith ai = a->i; 3267985db425SBarry Smith aj = a->j; 3268985db425SBarry Smith 32699566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32709566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32719566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 327208401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3273985db425SBarry Smith for (i = 0; i < m; i++) { 32749371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32759371c9d4SSatish Balay ai++; 3276d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32779371c9d4SSatish Balay x[i] = *aa; 32789371c9d4SSatish Balay if (idx) idx[i] = 0; 3279985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3280985db425SBarry Smith x[i] = 0.0; 3281985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3282985db425SBarry Smith for (j = 0; j < ncols; j++) { 3283985db425SBarry Smith if (aj[j] > j) { 3284985db425SBarry Smith idx[i] = j; 3285985db425SBarry Smith break; 3286985db425SBarry Smith } 3287985db425SBarry Smith } 3288fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3289fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3290985db425SBarry Smith } 3291985db425SBarry Smith } 3292985db425SBarry Smith for (j = 0; j < ncols; j++) { 32939371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32949371c9d4SSatish Balay x[i] = *aa; 32959371c9d4SSatish Balay if (idx) idx[i] = *aj; 32969371c9d4SSatish Balay } 32979371c9d4SSatish Balay aa++; 32989371c9d4SSatish Balay aj++; 3299e34fafa9SBarry Smith } 3300e34fafa9SBarry Smith } 33019566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 33029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 33033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3304e34fafa9SBarry Smith } 3305bbead8a2SBarry Smith 3306ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3307d71ae5a4SJacob Faibussowitsch { 3308bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 330933d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3310bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 33110da83c2eSBarry Smith const PetscReal shift = 0.0; 33121a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3313bbead8a2SBarry Smith 3314bbead8a2SBarry Smith PetscFunctionBegin; 3315a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33164a0d0026SBarry Smith if (a->ibdiagvalid) { 33174a0d0026SBarry Smith if (values) *values = a->ibdiag; 33183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 33194a0d0026SBarry Smith } 33209566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 33214dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3322bbead8a2SBarry Smith diag = a->ibdiag; 3323bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3324bbead8a2SBarry Smith /* factor and invert each block */ 3325bbead8a2SBarry Smith switch (bs) { 3326bbead8a2SBarry Smith case 1: 3327bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33289566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 3329ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3330ec1892c8SHong Zhang if (allowzeropivot) { 33317b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33327b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33337b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33349566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 333598921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3336ec1892c8SHong Zhang } 3337bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3338bbead8a2SBarry Smith } 3339bbead8a2SBarry Smith break; 3340bbead8a2SBarry Smith case 2: 3341bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33429371c9d4SSatish Balay ij[0] = 2 * i; 33439371c9d4SSatish Balay ij[1] = 2 * i + 1; 33449566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33459566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33467b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3348bbead8a2SBarry Smith diag += 4; 3349bbead8a2SBarry Smith } 3350bbead8a2SBarry Smith break; 3351bbead8a2SBarry Smith case 3: 3352bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33539371c9d4SSatish Balay ij[0] = 3 * i; 33549371c9d4SSatish Balay ij[1] = 3 * i + 1; 33559371c9d4SSatish Balay ij[2] = 3 * i + 2; 33569566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33579566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 33587b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33599566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3360bbead8a2SBarry Smith diag += 9; 3361bbead8a2SBarry Smith } 3362bbead8a2SBarry Smith break; 3363bbead8a2SBarry Smith case 4: 3364bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33659371c9d4SSatish Balay ij[0] = 4 * i; 33669371c9d4SSatish Balay ij[1] = 4 * i + 1; 33679371c9d4SSatish Balay ij[2] = 4 * i + 2; 33689371c9d4SSatish Balay ij[3] = 4 * i + 3; 33699566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33709566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33717b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33729566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3373bbead8a2SBarry Smith diag += 16; 3374bbead8a2SBarry Smith } 3375bbead8a2SBarry Smith break; 3376bbead8a2SBarry Smith case 5: 3377bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33789371c9d4SSatish Balay ij[0] = 5 * i; 33799371c9d4SSatish Balay ij[1] = 5 * i + 1; 33809371c9d4SSatish Balay ij[2] = 5 * i + 2; 33819371c9d4SSatish Balay ij[3] = 5 * i + 3; 33829371c9d4SSatish Balay ij[4] = 5 * i + 4; 33839566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33849566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33857b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33869566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3387bbead8a2SBarry Smith diag += 25; 3388bbead8a2SBarry Smith } 3389bbead8a2SBarry Smith break; 3390bbead8a2SBarry Smith case 6: 3391bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33929371c9d4SSatish Balay ij[0] = 6 * i; 33939371c9d4SSatish Balay ij[1] = 6 * i + 1; 33949371c9d4SSatish Balay ij[2] = 6 * i + 2; 33959371c9d4SSatish Balay ij[3] = 6 * i + 3; 33969371c9d4SSatish Balay ij[4] = 6 * i + 4; 33979371c9d4SSatish Balay ij[5] = 6 * i + 5; 33989566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33999566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 34007b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34019566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3402bbead8a2SBarry Smith diag += 36; 3403bbead8a2SBarry Smith } 3404bbead8a2SBarry Smith break; 3405bbead8a2SBarry Smith case 7: 3406bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 34079371c9d4SSatish Balay ij[0] = 7 * i; 34089371c9d4SSatish Balay ij[1] = 7 * i + 1; 34099371c9d4SSatish Balay ij[2] = 7 * i + 2; 34109371c9d4SSatish Balay ij[3] = 7 * i + 3; 34119371c9d4SSatish Balay ij[4] = 7 * i + 4; 34129371c9d4SSatish Balay ij[5] = 7 * i + 5; 3413cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 34149566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 34159566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 34167b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34179566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3418bbead8a2SBarry Smith diag += 49; 3419bbead8a2SBarry Smith } 3420bbead8a2SBarry Smith break; 3421bbead8a2SBarry Smith default: 34229566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3423bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3424ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34259566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34269566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 34277b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34289566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3429bbead8a2SBarry Smith diag += bs2; 3430bbead8a2SBarry Smith } 34319566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3432bbead8a2SBarry Smith } 3433bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 34343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3435bbead8a2SBarry Smith } 3436bbead8a2SBarry Smith 3437d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3438d71ae5a4SJacob Faibussowitsch { 343973a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3440fff043a9SJunchao Zhang PetscScalar a, *aa; 344173a71a0fSBarry Smith PetscInt m, n, i, j, col; 344273a71a0fSBarry Smith 344373a71a0fSBarry Smith PetscFunctionBegin; 344473a71a0fSBarry Smith if (!x->assembled) { 34459566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 344673a71a0fSBarry Smith for (i = 0; i < m; i++) { 344773a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34489566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 344973a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34509566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 345173a71a0fSBarry Smith } 345273a71a0fSBarry Smith } 3453e2ce353bSJunchao Zhang } else { 34549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34559566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3457e2ce353bSJunchao Zhang } 34589566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34599566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 346173a71a0fSBarry Smith } 346273a71a0fSBarry Smith 3463679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3464d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3465d71ae5a4SJacob Faibussowitsch { 3466679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3467679944adSJunchao Zhang PetscScalar a; 3468679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3469679944adSJunchao Zhang 3470679944adSJunchao Zhang PetscFunctionBegin; 3471679944adSJunchao Zhang nskip = high - low; 34729566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3473679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3474679944adSJunchao Zhang for (i = 0; i < m; i++) { 3475679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34769566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3477679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3478679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34799566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3480679944adSJunchao Zhang } 3481e2ce353bSJunchao Zhang } 34829566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34839566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3485679944adSJunchao Zhang } 3486679944adSJunchao Zhang 34870a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3488cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3489cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3490cb5b572fSBarry Smith MatMult_SeqAIJ, 349197304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34927c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34937c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3494f4259b30SLisandro Dalcin NULL, 3495f4259b30SLisandro Dalcin NULL, 3496f4259b30SLisandro Dalcin NULL, 3497f4259b30SLisandro Dalcin /* 10*/ NULL, 3498cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3499f4259b30SLisandro Dalcin NULL, 350041f059aeSBarry Smith MatSOR_SeqAIJ, 350191e9d3e2SHong Zhang MatTranspose_SeqAIJ, 350297304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3503cb5b572fSBarry Smith MatEqual_SeqAIJ, 3504cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3505cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3506cb5b572fSBarry Smith MatNorm_SeqAIJ, 3507f4259b30SLisandro Dalcin /* 20*/ NULL, 3508cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3509cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3510cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3511d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3512f4259b30SLisandro Dalcin NULL, 3513f4259b30SLisandro Dalcin NULL, 3514f4259b30SLisandro Dalcin NULL, 3515f4259b30SLisandro Dalcin NULL, 351626cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 3517f4259b30SLisandro Dalcin NULL, 3518f4259b30SLisandro Dalcin NULL, 3519f4259b30SLisandro Dalcin NULL, 3520f4259b30SLisandro Dalcin NULL, 3521d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3522f4259b30SLisandro Dalcin NULL, 3523f4259b30SLisandro Dalcin NULL, 3524cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3525f4259b30SLisandro Dalcin NULL, 3526d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35277dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3528cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3529cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3530cb5b572fSBarry Smith MatCopy_SeqAIJ, 3531d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3532cb5b572fSBarry Smith MatScale_SeqAIJ, 35337d68702bSBarry Smith MatShift_SeqAIJ, 353479299369SBarry Smith MatDiagonalSet_SeqAIJ, 35356e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 353673a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35373b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35383b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35393b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3540a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 354193dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3542f4259b30SLisandro Dalcin NULL, 3543f4259b30SLisandro Dalcin NULL, 3544cda55fadSBarry Smith MatPermute_SeqAIJ, 3545f4259b30SLisandro Dalcin NULL, 3546f4259b30SLisandro Dalcin /* 59*/ NULL, 3547b9b97703SBarry Smith MatDestroy_SeqAIJ, 3548b9b97703SBarry Smith MatView_SeqAIJ, 3549f4259b30SLisandro Dalcin NULL, 3550f4259b30SLisandro Dalcin NULL, 3551f4259b30SLisandro Dalcin /* 64*/ NULL, 3552321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3553f4259b30SLisandro Dalcin NULL, 3554f4259b30SLisandro Dalcin NULL, 3555f4259b30SLisandro Dalcin NULL, 3556d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3557c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3558f4259b30SLisandro Dalcin NULL, 3559f4259b30SLisandro Dalcin NULL, 3560f4259b30SLisandro Dalcin NULL, 3561f4259b30SLisandro Dalcin /* 74*/ NULL, 35623acb8795SBarry Smith MatFDColoringApply_AIJ, 3563f4259b30SLisandro Dalcin NULL, 3564f4259b30SLisandro Dalcin NULL, 3565f4259b30SLisandro Dalcin NULL, 35666ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3567f4259b30SLisandro Dalcin NULL, 3568f4259b30SLisandro Dalcin NULL, 3569f4259b30SLisandro Dalcin NULL, 3570bc011b1eSHong Zhang MatLoad_SeqAIJ, 35716cff0a6bSPierre Jolivet /* 84*/ NULL, 35726cff0a6bSPierre Jolivet NULL, 3573f4259b30SLisandro Dalcin NULL, 3574f4259b30SLisandro Dalcin NULL, 3575f4259b30SLisandro Dalcin NULL, 3576f4259b30SLisandro Dalcin /* 89*/ NULL, 3577f4259b30SLisandro Dalcin NULL, 357826be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3579f4259b30SLisandro Dalcin NULL, 3580f4259b30SLisandro Dalcin NULL, 35818fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3582f4259b30SLisandro Dalcin NULL, 3583f4259b30SLisandro Dalcin NULL, 35846fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3585f4259b30SLisandro Dalcin NULL, 35864222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3587f4259b30SLisandro Dalcin NULL, 3588f4259b30SLisandro Dalcin NULL, 358987d4246cSBarry Smith MatConjugate_SeqAIJ, 3590f4259b30SLisandro Dalcin NULL, 3591d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 359299cafbc1SBarry Smith MatRealPart_SeqAIJ, 3593f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3594f4259b30SLisandro Dalcin NULL, 3595f4259b30SLisandro Dalcin NULL, 3596cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3597f4259b30SLisandro Dalcin NULL, 35982af78befSBarry Smith MatGetRowMin_SeqAIJ, 3599f4259b30SLisandro Dalcin NULL, 3600599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3601f4259b30SLisandro Dalcin /*114*/ NULL, 3602f4259b30SLisandro Dalcin NULL, 3603f4259b30SLisandro Dalcin NULL, 3604f4259b30SLisandro Dalcin NULL, 3605f4259b30SLisandro Dalcin NULL, 3606f4259b30SLisandro Dalcin /*119*/ NULL, 3607f4259b30SLisandro Dalcin NULL, 3608f4259b30SLisandro Dalcin NULL, 3609f4259b30SLisandro Dalcin NULL, 3610b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 36110716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3612a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 361337868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 36140da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3615f4259b30SLisandro Dalcin NULL, 3616f4259b30SLisandro Dalcin /*129*/ NULL, 3617f4259b30SLisandro Dalcin NULL, 3618f4259b30SLisandro Dalcin NULL, 361975648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3620b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3621b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36222b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3623f4259b30SLisandro Dalcin NULL, 3624f4259b30SLisandro Dalcin NULL, 36253964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3626f4259b30SLisandro Dalcin /*139*/ NULL, 3627f4259b30SLisandro Dalcin NULL, 3628f4259b30SLisandro Dalcin NULL, 36293a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36309c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36314222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36324222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3633f4259b30SLisandro Dalcin NULL, 363472833a62Smarkadams4 NULL, 363572833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36362d776b49SBarry Smith NULL, 3637dec0b466SHong Zhang /*150*/ MatTransposeSymbolic_SeqAIJ, 3638eede4a3fSMark Adams MatEliminateZeros_SeqAIJ, 3639eede4a3fSMark Adams MatGetRowSumAbs_SeqAIJ}; 364017ab2063SBarry Smith 3641ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3642d71ae5a4SJacob Faibussowitsch { 3643bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 364497f1f81fSBarry Smith PetscInt i, nz, n; 3645bef8e0ddSBarry Smith 3646bef8e0ddSBarry Smith PetscFunctionBegin; 3647bef8e0ddSBarry Smith nz = aij->maxnz; 3648d0f46423SBarry Smith n = mat->rmap->n; 3649ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3650bef8e0ddSBarry Smith aij->nz = nz; 3651ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 36523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3653bef8e0ddSBarry Smith } 3654bef8e0ddSBarry Smith 3655a3bb6f32SFande Kong /* 3656ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 3657ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3658ddea5d60SJunchao Zhang */ 3659d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3660d71ae5a4SJacob Faibussowitsch { 3661a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3662eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3663eec179cfSJacob Faibussowitsch PetscHashIter tpos; 366425b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 366525b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3666a3bb6f32SFande Kong 3667a3bb6f32SFande Kong PetscFunctionBegin; 3668a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 36694f572ea9SToby Isaac PetscAssertPointer(mapping, 2); 3670a3bb6f32SFande Kong /* use a table */ 3671eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3672a3bb6f32SFande Kong ec = 0; 367325b670f0SStefano Zampini for (i = 0; i < nz; i++) { 367425b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3675eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3676a3bb6f32SFande Kong if (!data) { 3677a3bb6f32SFande Kong /* one based table */ 3678c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3679a3bb6f32SFande Kong } 3680a3bb6f32SFande Kong } 3681a3bb6f32SFande Kong /* form array of columns we need */ 36829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3683eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3684eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3685eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3686eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3687eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3688a3bb6f32SFande Kong gid--; 3689a3bb6f32SFande Kong lid--; 3690a3bb6f32SFande Kong garray[lid] = gid; 3691a3bb6f32SFande Kong } 36929566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3693eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3694c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3695a3bb6f32SFande Kong /* compact out the extra columns in B */ 369625b670f0SStefano Zampini for (i = 0; i < nz; i++) { 369725b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3698eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3699a3bb6f32SFande Kong lid--; 370025b670f0SStefano Zampini jj[i] = lid; 3701a3bb6f32SFande Kong } 37029566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3703eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 37049566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 37059566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 37069566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 37073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3708a3bb6f32SFande Kong } 3709a3bb6f32SFande Kong 3710bef8e0ddSBarry Smith /*@ 3711bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3712bef8e0ddSBarry Smith in the matrix. 3713bef8e0ddSBarry Smith 3714bef8e0ddSBarry Smith Input Parameters: 371511a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3716bef8e0ddSBarry Smith - indices - the column indices 3717bef8e0ddSBarry Smith 371815091d37SBarry Smith Level: advanced 371915091d37SBarry Smith 3720bef8e0ddSBarry Smith Notes: 3721bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3722bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 372311a5261eSBarry Smith of the `MatSetValues()` operation. 3724bef8e0ddSBarry Smith 3725bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 372611a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3727bef8e0ddSBarry Smith 372811a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3729bef8e0ddSBarry Smith 3730b9617806SBarry Smith The indices should start with zero, not one. 3731b9617806SBarry Smith 37321cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ` 3733bef8e0ddSBarry Smith @*/ 3734d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3735d71ae5a4SJacob Faibussowitsch { 3736bef8e0ddSBarry Smith PetscFunctionBegin; 37370700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 37384f572ea9SToby Isaac PetscAssertPointer(indices, 2); 3739cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 37403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3741bef8e0ddSBarry Smith } 3742bef8e0ddSBarry Smith 3743ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3744d71ae5a4SJacob Faibussowitsch { 3745be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3746d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3747be6bf707SBarry Smith 3748be6bf707SBarry Smith PetscFunctionBegin; 374928b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3750be6bf707SBarry Smith 3751be6bf707SBarry Smith /* allocate space for values if not already there */ 37524dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3753be6bf707SBarry Smith 3754be6bf707SBarry Smith /* copy values over */ 37559566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 37563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3757be6bf707SBarry Smith } 3758be6bf707SBarry Smith 3759be6bf707SBarry Smith /*@ 376020f4b53cSBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the 3761be6bf707SBarry Smith nonlinear portion. 3762be6bf707SBarry Smith 3763c3339decSBarry Smith Logically Collect 3764be6bf707SBarry Smith 376527430b45SBarry Smith Input Parameter: 376611a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3767be6bf707SBarry Smith 376815091d37SBarry Smith Level: advanced 376915091d37SBarry Smith 37702920cce0SJacob Faibussowitsch Example Usage: 377127430b45SBarry Smith .vb 37722ef1f0ffSBarry Smith Using SNES 377327430b45SBarry Smith Create Jacobian matrix 377427430b45SBarry Smith Set linear terms into matrix 377527430b45SBarry Smith Apply boundary conditions to matrix, at this time matrix must have 377627430b45SBarry Smith final nonzero structure (i.e. setting the nonlinear terms and applying 377727430b45SBarry Smith boundary conditions again will not change the nonzero structure 377827430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 377927430b45SBarry Smith MatStoreValues(mat); 378027430b45SBarry Smith Call SNESSetJacobian() with matrix 378127430b45SBarry Smith In your Jacobian routine 378227430b45SBarry Smith MatRetrieveValues(mat); 378327430b45SBarry Smith Set nonlinear terms in matrix 3784be6bf707SBarry Smith 378527430b45SBarry Smith Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself: 378627430b45SBarry Smith // build linear portion of Jacobian 378727430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 378827430b45SBarry Smith MatStoreValues(mat); 378927430b45SBarry Smith loop over nonlinear iterations 379027430b45SBarry Smith MatRetrieveValues(mat); 379127430b45SBarry Smith // call MatSetValues(mat,...) to set nonliner portion of Jacobian 379227430b45SBarry Smith // call MatAssemblyBegin/End() on matrix 379327430b45SBarry Smith Solve linear system with Jacobian 379427430b45SBarry Smith endloop 379527430b45SBarry Smith .ve 3796be6bf707SBarry Smith 3797be6bf707SBarry Smith Notes: 3798da81f932SPierre Jolivet Matrix must already be assembled before calling this routine 379911a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3800be6bf707SBarry Smith calling this routine. 3801be6bf707SBarry Smith 38020c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 38030c468ba9SBarry Smith and does not allocated additional space. 38040c468ba9SBarry Smith 3805fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()` 3806be6bf707SBarry Smith @*/ 3807d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3808d71ae5a4SJacob Faibussowitsch { 3809be6bf707SBarry Smith PetscFunctionBegin; 38100700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 381128b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 381228b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3813cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 38143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3815be6bf707SBarry Smith } 3816be6bf707SBarry Smith 3817ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3818d71ae5a4SJacob Faibussowitsch { 3819be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3820d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3821be6bf707SBarry Smith 3822be6bf707SBarry Smith PetscFunctionBegin; 382328b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 382428b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3825be6bf707SBarry Smith /* copy values over */ 38269566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 38273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3828be6bf707SBarry Smith } 3829be6bf707SBarry Smith 3830be6bf707SBarry Smith /*@ 383120f4b53cSBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()` 3832be6bf707SBarry Smith 3833c3339decSBarry Smith Logically Collect 3834be6bf707SBarry Smith 38352fe279fdSBarry Smith Input Parameter: 383611a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3837be6bf707SBarry Smith 383815091d37SBarry Smith Level: advanced 383915091d37SBarry Smith 38401cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()` 3841be6bf707SBarry Smith @*/ 3842d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3843d71ae5a4SJacob Faibussowitsch { 3844be6bf707SBarry Smith PetscFunctionBegin; 38450700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 384628b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 384728b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3848cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 38493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3850be6bf707SBarry Smith } 3851be6bf707SBarry Smith 3852*5d83a8b1SBarry Smith /*@ 385311a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 38540d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 385520f4b53cSBarry Smith the user should preallocate the matrix storage by setting the parameter `nz` 385620f4b53cSBarry Smith (or the array `nnz`). 385717ab2063SBarry Smith 3858d083f849SBarry Smith Collective 3859db81eaa0SLois Curfman McInnes 386017ab2063SBarry Smith Input Parameters: 386111a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 386217ab2063SBarry Smith . m - number of rows 386317ab2063SBarry Smith . n - number of columns 386417ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 386551c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38660298fd71SBarry Smith (possibly different for each row) or NULL 386717ab2063SBarry Smith 386817ab2063SBarry Smith Output Parameter: 3869416022c9SBarry Smith . A - the matrix 387017ab2063SBarry Smith 38712ef1f0ffSBarry Smith Options Database Keys: 38722ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 38732ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 38742ef1f0ffSBarry Smith 38752ef1f0ffSBarry Smith Level: intermediate 3876175b88e8SBarry Smith 3877b259b22eSLois Curfman McInnes Notes: 387877433607SBarry Smith It is recommend to use `MatCreateFromOptions()` instead of this routine 387977433607SBarry Smith 38802ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 388149a6f317SBarry Smith 38822ef1f0ffSBarry Smith The `MATSEQAIJ` format, also called 38832ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 38840002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 38852ef1f0ffSBarry Smith either one (as in Fortran) or zero. 388617ab2063SBarry Smith 388720f4b53cSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 38882ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 388920f4b53cSBarry Smith allocation. 389017ab2063SBarry Smith 3891682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38924fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3893682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38946c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 38956c7ebb05SLois Curfman McInnes 38961cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 389717ab2063SBarry Smith @*/ 3898d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3899d71ae5a4SJacob Faibussowitsch { 39003a40ed3dSBarry Smith PetscFunctionBegin; 39019566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 39029566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 39039566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 39049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 39053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3906273d9f13SBarry Smith } 3907273d9f13SBarry Smith 3908*5d83a8b1SBarry Smith /*@ 3909273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3910273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3911273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3912273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3913273d9f13SBarry Smith 3914d083f849SBarry Smith Collective 3915273d9f13SBarry Smith 3916273d9f13SBarry Smith Input Parameters: 39171c4f3114SJed Brown + B - The matrix 3918273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3919273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 39200298fd71SBarry Smith (possibly different for each row) or NULL 3921273d9f13SBarry Smith 39222ef1f0ffSBarry Smith Options Database Keys: 39232ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 39242ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 39252ef1f0ffSBarry Smith 39262ef1f0ffSBarry Smith Level: intermediate 39272ef1f0ffSBarry Smith 3928273d9f13SBarry Smith Notes: 39292ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 393049a6f317SBarry Smith 393111a5261eSBarry Smith The `MATSEQAIJ` format also called 39322ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 3933273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3934273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3935273d9f13SBarry Smith 39362ef1f0ffSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 39372ef1f0ffSBarry Smith Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 39382ef1f0ffSBarry Smith allocation. 3939273d9f13SBarry Smith 394011a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3941aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3942aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3943aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 3944aa95bbe8SBarry Smith 394511a5261eSBarry Smith Developer Notes: 394611a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3947a96a251dSBarry Smith entries or columns indices 3948a96a251dSBarry Smith 3949273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3950273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3951273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3952273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3953273d9f13SBarry Smith 39541cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3955db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3956273d9f13SBarry Smith @*/ 3957d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3958d71ae5a4SJacob Faibussowitsch { 3959a23d5eceSKris Buschelman PetscFunctionBegin; 39606ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39616ba663aaSJed Brown PetscValidType(B, 1); 3962cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 39633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3964a23d5eceSKris Buschelman } 3965a23d5eceSKris Buschelman 3966d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3967d71ae5a4SJacob Faibussowitsch { 3968ad79cf63SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 39692576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE; 397097f1f81fSBarry Smith PetscInt i; 3971273d9f13SBarry Smith 3972273d9f13SBarry Smith PetscFunctionBegin; 3973ad79cf63SBarry Smith if (B->hash_active) { 3974aea10558SJacob Faibussowitsch B->ops[0] = b->cops; 3975ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3976ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3977ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3978ad79cf63SBarry Smith } 39792576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3980a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3981c461c341SBarry Smith skipallocation = PETSC_TRUE; 3982c461c341SBarry Smith nz = 0; 3983c461c341SBarry Smith } 39849566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39859566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3986899cda47SBarry Smith 3987435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 398808401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3989cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3990d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 399108401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 399208401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3993b73539f3SBarry Smith } 3994b73539f3SBarry Smith } 3995b73539f3SBarry Smith 3996273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3997ab93d7beSBarry Smith if (!skipallocation) { 39984dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3999071fcb05SBarry Smith if (!b->ilen) { 4000071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. */ 40019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 4002071fcb05SBarry Smith } else { 40039566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 40042ee49352SLisandro Dalcin } 4005aa624791SPierre Jolivet if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); 4006273d9f13SBarry Smith if (!nnz) { 4007435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 4008c62bd62aSJed Brown else if (nz < 0) nz = 1; 40095d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 4010d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 4011c43c4a61SBarry Smith PetscCall(PetscIntMultError(nz, B->rmap->n, &nz)); 4012273d9f13SBarry Smith } else { 4013c73702f5SBarry Smith PetscInt64 nz64 = 0; 40149371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 40159371c9d4SSatish Balay b->imax[i] = nnz[i]; 40169371c9d4SSatish Balay nz64 += nnz[i]; 40179371c9d4SSatish Balay } 40189566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 4019273d9f13SBarry Smith } 4020ab93d7beSBarry Smith 4021273d9f13SBarry Smith /* allocate the matrix space */ 402253dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? */ 40239566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 4024396832f4SHong Zhang if (B->structure_only) { 40259566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 40269566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 4027396832f4SHong Zhang } else { 40289566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 4029396832f4SHong Zhang } 4030bfeeae90SHong Zhang b->i[0] = 0; 4031ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4032396832f4SHong Zhang if (B->structure_only) { 4033396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4034396832f4SHong Zhang b->free_a = PETSC_FALSE; 4035396832f4SHong Zhang } else { 4036273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4037e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4038396832f4SHong Zhang } 4039e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4040c461c341SBarry Smith } else { 4041e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4042e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4043c461c341SBarry Smith } 4044273d9f13SBarry Smith 4045846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4046846b4da1SFande Kong /* reserve user-requested sparsity */ 40479566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4048846b4da1SFande Kong } 4049846b4da1SFande Kong 4050273d9f13SBarry Smith b->nz = 0; 4051273d9f13SBarry Smith b->maxnz = nz; 4052273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40531baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4054cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4055cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40565519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40575519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 40585519a089SJose E. Roman */ 40595519a089SJose E. Roman B->nonzerostate++; 40603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4061273d9f13SBarry Smith } 4062273d9f13SBarry Smith 4063ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4064d71ae5a4SJacob Faibussowitsch { 4065846b4da1SFande Kong Mat_SeqAIJ *a; 4066a5bbaf83SFande Kong PetscInt i; 40671f14be2bSBarry Smith PetscBool skipreset; 4068846b4da1SFande Kong 4069846b4da1SFande Kong PetscFunctionBegin; 4070846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 407114d0e64fSAlex Lindsay 407214d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 40733ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 407414d0e64fSAlex Lindsay 4075846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40762c814fdeSFande Kong /* if no saved info, we error out */ 407728b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40782c814fdeSFande Kong 40791f14be2bSBarry Smith PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40802c814fdeSFande Kong 40811f14be2bSBarry Smith PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset)); 40821f14be2bSBarry Smith if (!skipreset) { 40839566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40849566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4085846b4da1SFande Kong a->i[0] = 0; 4086ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4087846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4088846b4da1SFande Kong a->nz = 0; 4089846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4090846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4091846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4092846b4da1SFande Kong A->assembled = PETSC_FALSE; 40931f14be2bSBarry Smith } 40943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4095846b4da1SFande Kong } 4096846b4da1SFande Kong 409758d36128SBarry Smith /*@ 409811a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4099a1661176SMatthew Knepley 4100a1661176SMatthew Knepley Input Parameters: 4101a1661176SMatthew Knepley + B - the matrix 4102d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero) 4103d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row 4104d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided 4105a1661176SMatthew Knepley 4106a1661176SMatthew Knepley Level: developer 4107a1661176SMatthew Knepley 41086a9b8d82SBarry Smith Notes: 41092ef1f0ffSBarry Smith The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 411058d36128SBarry Smith 41116a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 41126a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 41136a9b8d82SBarry Smith 41146a9b8d82SBarry Smith Developer Notes: 41152ef1f0ffSBarry Smith An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and 41162ef1f0ffSBarry Smith then just copies the `v` values directly with `PetscMemcpy()`. 41176a9b8d82SBarry Smith 411811a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 41196a9b8d82SBarry Smith 4120fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()` 4121a1661176SMatthew Knepley @*/ 4122d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4123d71ae5a4SJacob Faibussowitsch { 4124a1661176SMatthew Knepley PetscFunctionBegin; 41250700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41266ba663aaSJed Brown PetscValidType(B, 1); 4127cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 41283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4129a1661176SMatthew Knepley } 4130a1661176SMatthew Knepley 4131ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4132d71ae5a4SJacob Faibussowitsch { 4133a1661176SMatthew Knepley PetscInt i; 4134a1661176SMatthew Knepley PetscInt m, n; 4135a1661176SMatthew Knepley PetscInt nz; 41366a9b8d82SBarry Smith PetscInt *nnz; 4137a1661176SMatthew Knepley 4138a1661176SMatthew Knepley PetscFunctionBegin; 4139aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4140779a8d59SSatish Balay 41419566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41429566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4143779a8d59SSatish Balay 41449566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41459566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4146a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4147b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 414808401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4149a1661176SMatthew Knepley nnz[i] = nz; 4150a1661176SMatthew Knepley } 41519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41529566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4153a1661176SMatthew Knepley 41548e3a54c0SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES)); 4155a1661176SMatthew Knepley 41569566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41579566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4158a1661176SMatthew Knepley 41599566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 41603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4161a1661176SMatthew Knepley } 4162a1661176SMatthew Knepley 4163ad7e164aSPierre Jolivet /*@ 41642ef1f0ffSBarry Smith MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`. 4165ad7e164aSPierre Jolivet 4166ad7e164aSPierre Jolivet Input Parameters: 4167ad7e164aSPierre Jolivet + A - left-hand side matrix 4168ad7e164aSPierre Jolivet . B - right-hand side matrix 416911a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4170ad7e164aSPierre Jolivet 4171ad7e164aSPierre Jolivet Output Parameter: 41722ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B` 4173ad7e164aSPierre Jolivet 4174ad7e164aSPierre Jolivet Level: intermediate 4175ad7e164aSPierre Jolivet 417611a5261eSBarry Smith Note: 417711a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 4178ad7e164aSPierre Jolivet 41791cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4180ad7e164aSPierre Jolivet @*/ 4181d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4182d71ae5a4SJacob Faibussowitsch { 4183ad7e164aSPierre Jolivet PetscFunctionBegin; 4184ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4185ad7e164aSPierre Jolivet PetscValidType(A, 1); 4186ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4187ad7e164aSPierre Jolivet PetscValidType(B, 2); 41884f572ea9SToby Isaac PetscAssertPointer(C, 4); 4189ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4190ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4191ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4192ad7e164aSPierre Jolivet } 4193cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 41943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4195ad7e164aSPierre Jolivet } 4196ad7e164aSPierre Jolivet 4197ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4198d71ae5a4SJacob Faibussowitsch { 4199ad7e164aSPierre Jolivet Mat newmat; 4200ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4201ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4202ad7e164aSPierre Jolivet PetscScalar *v; 4203fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4204ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4205ad7e164aSPierre Jolivet PetscBool flg; 4206ad7e164aSPierre Jolivet 4207ad7e164aSPierre Jolivet PetscFunctionBegin; 420828b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 420928b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 421028b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 421128b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 42129566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 421328b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4214aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4215ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42169566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 42179566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 42189566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 42199566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4220ad7e164aSPierre Jolivet i[0] = 0; 4221ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4222ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4223ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4224ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4225ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4226ad7e164aSPierre Jolivet } 4227ad7e164aSPierre Jolivet } 4228ad7e164aSPierre Jolivet } 42299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4230ad7e164aSPierre Jolivet *C = newmat; 42319566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4232ad7e164aSPierre Jolivet nnz = 0; 4233ad7e164aSPierre Jolivet } 42349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 42359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4237ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4238ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4239ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4240ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4241ad7e164aSPierre Jolivet } 4242ad7e164aSPierre Jolivet } 4243ad7e164aSPierre Jolivet } 42449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 42473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4248ad7e164aSPierre Jolivet } 4249ad7e164aSPierre Jolivet 4250c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4251af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4252170fe5c8SBarry Smith 4253170fe5c8SBarry Smith /* 4254170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4255170fe5c8SBarry Smith 4256170fe5c8SBarry Smith n p p 42572da392ccSBarry Smith [ ] [ ] [ ] 42582da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42592da392ccSBarry Smith [ ] [ ] [ ] 4260170fe5c8SBarry Smith 4261170fe5c8SBarry Smith */ 4262d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4263d71ae5a4SJacob Faibussowitsch { 4264170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4265170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4266170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 426786214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4268170fe5c8SBarry Smith const PetscInt *ii, *idx; 4269170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4270170fe5c8SBarry Smith PetscScalar *c, *c_q; 427186214ceeSStefano Zampini PetscInt clda = sub_c->lda; 427286214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4273170fe5c8SBarry Smith 4274170fe5c8SBarry Smith PetscFunctionBegin; 4275d0f46423SBarry Smith m = A->rmap->n; 4276d0f46423SBarry Smith n = A->cmap->n; 4277d0f46423SBarry Smith p = B->cmap->n; 4278170fe5c8SBarry Smith a = sub_a->v; 4279170fe5c8SBarry Smith b = sub_b->a; 4280170fe5c8SBarry Smith c = sub_c->v; 428186214ceeSStefano Zampini if (clda == m) { 42829566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 428386214ceeSStefano Zampini } else { 428486214ceeSStefano Zampini for (j = 0; j < p; j++) 42859371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 428686214ceeSStefano Zampini } 4287170fe5c8SBarry Smith ii = sub_b->i; 4288170fe5c8SBarry Smith idx = sub_b->j; 4289170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4290170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4291170fe5c8SBarry Smith while (q-- > 0) { 429286214ceeSStefano Zampini c_q = c + clda * (*idx); 429386214ceeSStefano Zampini a_q = a + alda * i; 4294854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4295170fe5c8SBarry Smith idx++; 4296170fe5c8SBarry Smith b++; 4297170fe5c8SBarry Smith } 4298170fe5c8SBarry Smith } 42993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4300170fe5c8SBarry Smith } 4301170fe5c8SBarry Smith 4302d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4303d71ae5a4SJacob Faibussowitsch { 4304d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 430586214ceeSStefano Zampini PetscBool cisdense; 4306170fe5c8SBarry Smith 4307170fe5c8SBarry Smith PetscFunctionBegin; 430808401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 43099566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 43109566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 4311d5e393b6SSuyash Tandon PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 431248a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 43139566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4314d73949e8SHong Zhang 43154222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 43163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4317170fe5c8SBarry Smith } 4318170fe5c8SBarry Smith 43190bad9183SKris Buschelman /*MC 4320fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43210bad9183SKris Buschelman based on compressed sparse row format. 43220bad9183SKris Buschelman 43232ef1f0ffSBarry Smith Options Database Key: 43240bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43250bad9183SKris Buschelman 43260bad9183SKris Buschelman Level: beginner 43270bad9183SKris Buschelman 43280cd7f59aSBarry Smith Notes: 43292ef1f0ffSBarry Smith `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values, 43300cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43310cd7f59aSBarry Smith in the matrix 43320cd7f59aSBarry Smith 433311a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. In this no 433411a5261eSBarry Smith space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored 43350cd7f59aSBarry Smith 433611a5261eSBarry Smith Developer Note: 43372ef1f0ffSBarry Smith It would be nice if all matrix formats supported passing `NULL` in for the numerical values 43380cd7f59aSBarry Smith 43391cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 43400bad9183SKris Buschelman M*/ 43410bad9183SKris Buschelman 4342ccd284c7SBarry Smith /*MC 4343ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 4344ccd284c7SBarry Smith 434511a5261eSBarry Smith This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator, 434611a5261eSBarry Smith and `MATMPIAIJ` otherwise. As a result, for single process communicators, 434711a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4348ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4349ccd284c7SBarry Smith the above preallocation routines for simplicity. 4350ccd284c7SBarry Smith 43512ef1f0ffSBarry Smith Options Database Key: 435211a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()` 4353ccd284c7SBarry Smith 43542ef1f0ffSBarry Smith Level: beginner 43552ef1f0ffSBarry Smith 435611a5261eSBarry Smith Note: 435711a5261eSBarry Smith Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when 4358ccd284c7SBarry Smith enough exist. 4359ccd284c7SBarry Smith 43601cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4361ccd284c7SBarry Smith M*/ 4362ccd284c7SBarry Smith 4363ccd284c7SBarry Smith /*MC 4364ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4365ccd284c7SBarry Smith 43662ef1f0ffSBarry Smith Options Database Key: 43672ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 43682ef1f0ffSBarry Smith 43692ef1f0ffSBarry Smith Level: beginner 43702ef1f0ffSBarry Smith 43712ef1f0ffSBarry Smith Note: 437211a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 437311a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 437411a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4375ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4376ccd284c7SBarry Smith the above preallocation routines for simplicity. 4377ccd284c7SBarry Smith 43781cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4379ccd284c7SBarry Smith M*/ 4380ccd284c7SBarry Smith 43817906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43827906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43837906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43847906f579SHong Zhang #endif 4385d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4386d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4387d24d4204SJose E. Roman #endif 43887906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43897906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43907906f579SHong Zhang #endif 43917906f579SHong Zhang 4392d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4393c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43944222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43957906f579SHong Zhang 43968c778c55SBarry Smith /*@C 439711a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43988c778c55SBarry Smith 43998c778c55SBarry Smith Not Collective 44008c778c55SBarry Smith 44018c778c55SBarry Smith Input Parameter: 4402fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44038c778c55SBarry Smith 44048c778c55SBarry Smith Output Parameter: 44058c778c55SBarry Smith . array - pointer to the data 44068c778c55SBarry Smith 44078c778c55SBarry Smith Level: intermediate 44088c778c55SBarry Smith 4409fe59aa6dSJacob Faibussowitsch Fortran Notes: 44100ab4885dSBarry Smith `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()` 44110ab4885dSBarry Smith 44121cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 44138c778c55SBarry Smith @*/ 4414*5d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[]) 4415d71ae5a4SJacob Faibussowitsch { 4416d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44178c778c55SBarry Smith 44188c778c55SBarry Smith PetscFunctionBegin; 4419d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44209566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4421d67d9f35SJunchao Zhang } else { 4422d67d9f35SJunchao Zhang *array = aij->a; 4423d67d9f35SJunchao Zhang } 44243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4425d67d9f35SJunchao Zhang } 4426d67d9f35SJunchao Zhang 4427d67d9f35SJunchao Zhang /*@C 442811a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4429d67d9f35SJunchao Zhang 4430d67d9f35SJunchao Zhang Not Collective 4431d67d9f35SJunchao Zhang 4432d67d9f35SJunchao Zhang Input Parameters: 4433fe59aa6dSJacob Faibussowitsch + A - a `MATSEQAIJ` matrix 4434d67d9f35SJunchao Zhang - array - pointer to the data 4435d67d9f35SJunchao Zhang 4436d67d9f35SJunchao Zhang Level: intermediate 4437d67d9f35SJunchao Zhang 4438fe59aa6dSJacob Faibussowitsch Fortran Notes: 44390ab4885dSBarry Smith `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()` 44400ab4885dSBarry Smith 44411cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4442d67d9f35SJunchao Zhang @*/ 4443*5d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[]) 4444d71ae5a4SJacob Faibussowitsch { 4445d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4446d67d9f35SJunchao Zhang 4447d67d9f35SJunchao Zhang PetscFunctionBegin; 4448d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44499566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4450d67d9f35SJunchao Zhang } else { 4451d67d9f35SJunchao Zhang *array = NULL; 4452d67d9f35SJunchao Zhang } 44539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44549566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44568c778c55SBarry Smith } 44578c778c55SBarry Smith 445821e72a00SBarry Smith /*@C 445911a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44608f1ea47aSStefano Zampini 44610ab4885dSBarry Smith Not Collective; No Fortran Support 44628f1ea47aSStefano Zampini 44638f1ea47aSStefano Zampini Input Parameter: 4464fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44658f1ea47aSStefano Zampini 44668f1ea47aSStefano Zampini Output Parameter: 44678f1ea47aSStefano Zampini . array - pointer to the data 44688f1ea47aSStefano Zampini 44698f1ea47aSStefano Zampini Level: intermediate 44708f1ea47aSStefano Zampini 44711cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44728f1ea47aSStefano Zampini @*/ 4473*5d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[]) 4474d71ae5a4SJacob Faibussowitsch { 4475d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44768f1ea47aSStefano Zampini 44778f1ea47aSStefano Zampini PetscFunctionBegin; 4478d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44799566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4480d67d9f35SJunchao Zhang } else { 4481d67d9f35SJunchao Zhang *array = aij->a; 4482d67d9f35SJunchao Zhang } 44833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44848f1ea47aSStefano Zampini } 44858f1ea47aSStefano Zampini 44868f1ea47aSStefano Zampini /*@C 448711a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44888f1ea47aSStefano Zampini 44890ab4885dSBarry Smith Not Collective; No Fortran Support 44908f1ea47aSStefano Zampini 44918f1ea47aSStefano Zampini Input Parameter: 4492fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44938f1ea47aSStefano Zampini 44948f1ea47aSStefano Zampini Output Parameter: 44958f1ea47aSStefano Zampini . array - pointer to the data 44968f1ea47aSStefano Zampini 44978f1ea47aSStefano Zampini Level: intermediate 44988f1ea47aSStefano Zampini 44991cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45008f1ea47aSStefano Zampini @*/ 4501*5d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[]) 4502d71ae5a4SJacob Faibussowitsch { 4503d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 45048f1ea47aSStefano Zampini 45058f1ea47aSStefano Zampini PetscFunctionBegin; 4506d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 45079566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4508d67d9f35SJunchao Zhang } else { 4509d67d9f35SJunchao Zhang *array = NULL; 4510d67d9f35SJunchao Zhang } 45113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4512d67d9f35SJunchao Zhang } 4513d67d9f35SJunchao Zhang 4514d67d9f35SJunchao Zhang /*@C 451511a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4516d67d9f35SJunchao Zhang 45170ab4885dSBarry Smith Not Collective; No Fortran Support 4518d67d9f35SJunchao Zhang 4519d67d9f35SJunchao Zhang Input Parameter: 4520fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 4521d67d9f35SJunchao Zhang 4522d67d9f35SJunchao Zhang Output Parameter: 4523d67d9f35SJunchao Zhang . array - pointer to the data 4524d67d9f35SJunchao Zhang 4525d67d9f35SJunchao Zhang Level: intermediate 4526d67d9f35SJunchao Zhang 45271cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4528d67d9f35SJunchao Zhang @*/ 4529*5d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[]) 4530d71ae5a4SJacob Faibussowitsch { 4531d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4532d67d9f35SJunchao Zhang 4533d67d9f35SJunchao Zhang PetscFunctionBegin; 4534d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45359566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4536d67d9f35SJunchao Zhang } else { 4537d67d9f35SJunchao Zhang *array = aij->a; 4538d67d9f35SJunchao Zhang } 45399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45409566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 45413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4542d67d9f35SJunchao Zhang } 4543d67d9f35SJunchao Zhang 4544d67d9f35SJunchao Zhang /*@C 4545d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4546d67d9f35SJunchao Zhang 45470ab4885dSBarry Smith Not Collective; No Fortran Support 4548d67d9f35SJunchao Zhang 4549d67d9f35SJunchao Zhang Input Parameter: 4550fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix 4551d67d9f35SJunchao Zhang 4552d67d9f35SJunchao Zhang Output Parameter: 4553d67d9f35SJunchao Zhang . array - pointer to the data 4554d67d9f35SJunchao Zhang 4555d67d9f35SJunchao Zhang Level: intermediate 4556d67d9f35SJunchao Zhang 45571cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4558d67d9f35SJunchao Zhang @*/ 4559*5d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[]) 4560d71ae5a4SJacob Faibussowitsch { 4561d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4562d67d9f35SJunchao Zhang 4563d67d9f35SJunchao Zhang PetscFunctionBegin; 4564d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45659566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4566d67d9f35SJunchao Zhang } else { 4567d67d9f35SJunchao Zhang *array = NULL; 4568d67d9f35SJunchao Zhang } 45693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45708f1ea47aSStefano Zampini } 45718f1ea47aSStefano Zampini 45728f1ea47aSStefano Zampini /*@C 457311a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45747ee59b9bSJunchao Zhang 45750ab4885dSBarry Smith Not Collective; No Fortran Support 45767ee59b9bSJunchao Zhang 45777ee59b9bSJunchao Zhang Input Parameter: 457811a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45797ee59b9bSJunchao Zhang 45807ee59b9bSJunchao Zhang Output Parameters: 45817ee59b9bSJunchao Zhang + i - row map array of the matrix 45827ee59b9bSJunchao Zhang . j - column index array of the matrix 45837ee59b9bSJunchao Zhang . a - data array of the matrix 4584fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays 45857ee59b9bSJunchao Zhang 4586fe59aa6dSJacob Faibussowitsch Level: developer 45872ef1f0ffSBarry Smith 45887ee59b9bSJunchao Zhang Notes: 45892ef1f0ffSBarry Smith Any of the output parameters can be `NULL`, in which case the corresponding value is not returned. 45907ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 45917ee59b9bSJunchao Zhang 45927ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45932ef1f0ffSBarry Smith If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix. 45947ee59b9bSJunchao Zhang 45951cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45967ee59b9bSJunchao Zhang @*/ 4597*5d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype) 4598d71ae5a4SJacob Faibussowitsch { 45997ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 46007ee59b9bSJunchao Zhang 46017ee59b9bSJunchao Zhang PetscFunctionBegin; 46027ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 46037ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 46047ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 46057ee59b9bSJunchao Zhang } else { 46067ee59b9bSJunchao Zhang if (i) *i = aij->i; 46077ee59b9bSJunchao Zhang if (j) *j = aij->j; 46087ee59b9bSJunchao Zhang if (a) *a = aij->a; 46097ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 46107ee59b9bSJunchao Zhang } 46113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 46127ee59b9bSJunchao Zhang } 46137ee59b9bSJunchao Zhang 4614cc4c1da9SBarry Smith /*@ 461521e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 461621e72a00SBarry Smith 461721e72a00SBarry Smith Not Collective 461821e72a00SBarry Smith 461921e72a00SBarry Smith Input Parameter: 4620fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 462121e72a00SBarry Smith 462221e72a00SBarry Smith Output Parameter: 462321e72a00SBarry Smith . nz - the maximum number of nonzeros in any row 462421e72a00SBarry Smith 462521e72a00SBarry Smith Level: intermediate 462621e72a00SBarry Smith 46271cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 462821e72a00SBarry Smith @*/ 4629d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4630d71ae5a4SJacob Faibussowitsch { 463121e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 463221e72a00SBarry Smith 463321e72a00SBarry Smith PetscFunctionBegin; 463421e72a00SBarry Smith *nz = aij->rmax; 46353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 463621e72a00SBarry Smith } 463721e72a00SBarry Smith 46382c4ab24aSJunchao Zhang static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void *data) 46392c4ab24aSJunchao Zhang { 46402c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)data; 46414d86920dSPierre Jolivet 46422c4ab24aSJunchao Zhang PetscFunctionBegin; 46432c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->perm)); 46442c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->jmap)); 46452c4ab24aSJunchao Zhang PetscCall(PetscFree(coo)); 46462c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 46472c4ab24aSJunchao Zhang } 46482c4ab24aSJunchao Zhang 4649d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4650d71ae5a4SJacob Faibussowitsch { 4651394ed5ebSJunchao Zhang MPI_Comm comm; 4652394ed5ebSJunchao Zhang PetscInt *i, *j; 46530d88f7f4SJunchao Zhang PetscInt M, N, row, iprev; 4654394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4655394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4656394ed5ebSJunchao Zhang PetscInt *Aj; 4657394ed5ebSJunchao Zhang PetscScalar *Aa; 4658f4f49eeaSPierre Jolivet Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)mat->data; 4659cbc6b225SStefano Zampini MatType rtype; 4660394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 46612c4ab24aSJunchao Zhang PetscContainer container; 46622c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 46630d88f7f4SJunchao Zhang PetscBool isorted; 4664394ed5ebSJunchao Zhang 4665394ed5ebSJunchao Zhang PetscFunctionBegin; 46669566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46679566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4668e8729f6fSJunchao Zhang i = coo_i; 4669e8729f6fSJunchao Zhang j = coo_j; 46709566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 46710d88f7f4SJunchao Zhang 46720d88f7f4SJunchao Zhang /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */ 46730d88f7f4SJunchao Zhang isorted = PETSC_TRUE; 46740d88f7f4SJunchao Zhang iprev = PETSC_INT_MIN; 46750d88f7f4SJunchao Zhang for (k = 0; k < coo_n; k++) { 4676394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 46770d88f7f4SJunchao Zhang if (isorted) { 46780d88f7f4SJunchao Zhang if (i[k] < iprev) isorted = PETSC_FALSE; 46790d88f7f4SJunchao Zhang else iprev = i[k]; 46800d88f7f4SJunchao Zhang } 4681394ed5ebSJunchao Zhang perm[k] = k; 4682394ed5ebSJunchao Zhang } 4683394ed5ebSJunchao Zhang 46840d88f7f4SJunchao Zhang /* Sort by row if not already */ 46850d88f7f4SJunchao Zhang if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 4686651b1cf9SStefano Zampini 4687651b1cf9SStefano Zampini /* Advance k to the first row with a non-negative index */ 4688651b1cf9SStefano Zampini for (k = 0; k < coo_n; k++) 46899371c9d4SSatish Balay if (i[k] >= 0) break; 4690394ed5ebSJunchao Zhang nneg = k; 46919566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */ 4692394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 469335cb6cd3SPierre Jolivet jmap++; /* Inc jmap by 1 for convenience */ 4694394ed5ebSJunchao Zhang 46959566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 46969566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4697394ed5ebSJunchao Zhang 4698651b1cf9SStefano Zampini /* Support for HYPRE */ 4699651b1cf9SStefano Zampini PetscBool hypre; 4700651b1cf9SStefano Zampini const char *name; 4701651b1cf9SStefano Zampini PetscCall(PetscObjectGetName((PetscObject)mat, &name)); 4702651b1cf9SStefano Zampini PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre)); 4703651b1cf9SStefano Zampini 4704394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 470535cb6cd3SPierre Jolivet Ai++; /* Inc by 1 for convenience */ 4706394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4707394ed5ebSJunchao Zhang while (k < coo_n) { 47080d88f7f4SJunchao Zhang PetscBool strictly_sorted; // this row is strictly sorted? 47090d88f7f4SJunchao Zhang PetscInt jprev; 47100d88f7f4SJunchao Zhang 47110d88f7f4SJunchao Zhang /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */ 4712394ed5ebSJunchao Zhang row = i[k]; 47130d88f7f4SJunchao Zhang start = k; 47140d88f7f4SJunchao Zhang jprev = PETSC_INT_MIN; 47150d88f7f4SJunchao Zhang strictly_sorted = PETSC_TRUE; 47160d88f7f4SJunchao Zhang while (k < coo_n && i[k] == row) { 47170d88f7f4SJunchao Zhang if (strictly_sorted) { 47180d88f7f4SJunchao Zhang if (j[k] <= jprev) strictly_sorted = PETSC_FALSE; 47190d88f7f4SJunchao Zhang else jprev = j[k]; 47200d88f7f4SJunchao Zhang } 47210d88f7f4SJunchao Zhang k++; 47220d88f7f4SJunchao Zhang } 4723394ed5ebSJunchao Zhang end = k; 47240d88f7f4SJunchao Zhang 4725651b1cf9SStefano Zampini /* hack for HYPRE: swap min column to diag so that diagonal values will go first */ 4726651b1cf9SStefano Zampini if (hypre) { 4727651b1cf9SStefano Zampini PetscInt minj = PETSC_MAX_INT; 4728651b1cf9SStefano Zampini PetscBool hasdiag = PETSC_FALSE; 47290d88f7f4SJunchao Zhang 47300d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to swap the first and the diag 47310d88f7f4SJunchao Zhang PetscCount tmp; 47320d88f7f4SJunchao Zhang for (p = start; p < end; p++) { 47330d88f7f4SJunchao Zhang if (j[p] == row && p != start) { 47340d88f7f4SJunchao Zhang j[p] = j[start]; 47350d88f7f4SJunchao Zhang j[start] = row; 47360d88f7f4SJunchao Zhang tmp = perm[start]; 47370d88f7f4SJunchao Zhang perm[start] = perm[p]; 47380d88f7f4SJunchao Zhang perm[p] = tmp; 47390d88f7f4SJunchao Zhang break; 47400d88f7f4SJunchao Zhang } 47410d88f7f4SJunchao Zhang } 47420d88f7f4SJunchao Zhang } else { 4743651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4744651b1cf9SStefano Zampini hasdiag = (PetscBool)(hasdiag || (j[p] == row)); 4745651b1cf9SStefano Zampini minj = PetscMin(minj, j[p]); 4746651b1cf9SStefano Zampini } 47470d88f7f4SJunchao Zhang 4748651b1cf9SStefano Zampini if (hasdiag) { 4749651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4750651b1cf9SStefano Zampini if (j[p] == minj) j[p] = row; 4751651b1cf9SStefano Zampini else if (j[p] == row) j[p] = minj; 4752651b1cf9SStefano Zampini } 4753651b1cf9SStefano Zampini } 4754651b1cf9SStefano Zampini } 47550d88f7f4SJunchao Zhang } 47560d88f7f4SJunchao Zhang // sort by columns in a row 47570d88f7f4SJunchao Zhang if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4758651b1cf9SStefano Zampini 47590d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q 47600d88f7f4SJunchao Zhang for (p = start; p < end; p++, q++) { 47610d88f7f4SJunchao Zhang Aj[q] = j[p]; 47620d88f7f4SJunchao Zhang jmap[q] = 1; 47630d88f7f4SJunchao Zhang } 47640d88f7f4SJunchao Zhang Ai[row] = end - start; 47650d88f7f4SJunchao Zhang nnz += Ai[row]; // q is already advanced 47660d88f7f4SJunchao Zhang } else { 4767394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4768394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 4769651b1cf9SStefano Zampini jmap[q] = 1; /* Number of repeats of this nonzero entry */ 4770394ed5ebSJunchao Zhang Ai[row] = 1; 4771394ed5ebSJunchao Zhang nnz++; 4772394ed5ebSJunchao Zhang 4773394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4774394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4775394ed5ebSJunchao Zhang q++; 4776394ed5ebSJunchao Zhang jmap[q] = 1; 4777394ed5ebSJunchao Zhang Aj[q] = j[p]; 4778394ed5ebSJunchao Zhang Ai[row]++; 4779394ed5ebSJunchao Zhang nnz++; 4780394ed5ebSJunchao Zhang } else { 4781394ed5ebSJunchao Zhang jmap[q]++; 4782394ed5ebSJunchao Zhang } 4783394ed5ebSJunchao Zhang } 4784394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4785394ed5ebSJunchao Zhang } 47860d88f7f4SJunchao Zhang } 47870d88f7f4SJunchao Zhang 4788394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4789394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 47900d88f7f4SJunchao Zhang jmap--; // Back to the beginning of jmap[] 4791394ed5ebSJunchao Zhang jmap[0] = 0; 4792394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 47930d88f7f4SJunchao Zhang 4794394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4795394ed5ebSJunchao Zhang PetscCount *jmap_new; 4796394ed5ebSJunchao Zhang PetscInt *Aj_new; 4797394ed5ebSJunchao Zhang 47989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 47999566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 48009566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4801394ed5ebSJunchao Zhang jmap = jmap_new; 4802394ed5ebSJunchao Zhang 48039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 48049566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 48059566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4806394ed5ebSJunchao Zhang Aj = Aj_new; 4807394ed5ebSJunchao Zhang } 4808394ed5ebSJunchao Zhang 4809394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4810394ed5ebSJunchao Zhang PetscCount *perm_new; 4811cbc6b225SStefano Zampini 48129566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 48139566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 48149566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4815394ed5ebSJunchao Zhang perm = perm_new; 4816394ed5ebSJunchao Zhang } 4817394ed5ebSJunchao Zhang 48189566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 48199566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 48209566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4821394ed5ebSJunchao Zhang 4822394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4823394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 48242c4ab24aSJunchao Zhang 48252c4ab24aSJunchao Zhang // Put the COO struct in a container and then attach that to the matrix 48262c4ab24aSJunchao Zhang PetscCall(PetscMalloc1(1, &coo)); 48272c4ab24aSJunchao Zhang coo->nz = nnz; 48282c4ab24aSJunchao Zhang coo->n = coo_n; 48292c4ab24aSJunchao Zhang coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again 48302c4ab24aSJunchao Zhang coo->jmap = jmap; // of length nnz+1 48312c4ab24aSJunchao Zhang coo->perm = perm; 48322c4ab24aSJunchao Zhang PetscCall(PetscContainerCreate(PETSC_COMM_SELF, &container)); 48332c4ab24aSJunchao Zhang PetscCall(PetscContainerSetPointer(container, coo)); 48342c4ab24aSJunchao Zhang PetscCall(PetscContainerSetUserDestroy(container, MatCOOStructDestroy_SeqAIJ)); 48352c4ab24aSJunchao Zhang PetscCall(PetscObjectCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", (PetscObject)container)); 48362c4ab24aSJunchao Zhang PetscCall(PetscContainerDestroy(&container)); 48373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4838394ed5ebSJunchao Zhang } 4839394ed5ebSJunchao Zhang 4840d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4841d71ae5a4SJacob Faibussowitsch { 4842394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4843394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 48442c4ab24aSJunchao Zhang PetscCount *perm, *jmap; 4845394ed5ebSJunchao Zhang PetscScalar *Aa; 48462c4ab24aSJunchao Zhang PetscContainer container; 48472c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 4848394ed5ebSJunchao Zhang 4849394ed5ebSJunchao Zhang PetscFunctionBegin; 48502c4ab24aSJunchao Zhang PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container)); 48512c4ab24aSJunchao Zhang PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix"); 48522c4ab24aSJunchao Zhang PetscCall(PetscContainerGetPointer(container, (void **)&coo)); 48532c4ab24aSJunchao Zhang perm = coo->perm; 48542c4ab24aSJunchao Zhang jmap = coo->jmap; 48559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4856394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4857b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4858b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4859b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4860394ed5ebSJunchao Zhang } 48619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 48623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4863394ed5ebSJunchao Zhang } 4864394ed5ebSJunchao Zhang 486534b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48665063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 486702fe1965SBarry Smith #endif 4868d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4869d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *); 4870d5e393b6SSuyash Tandon #endif 48713d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48725063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 48733d0639e7SStefano Zampini #endif 487402fe1965SBarry Smith 4875d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4876d71ae5a4SJacob Faibussowitsch { 4877273d9f13SBarry Smith Mat_SeqAIJ *b; 487838baddfdSBarry Smith PetscMPIInt size; 4879273d9f13SBarry Smith 4880273d9f13SBarry Smith PetscFunctionBegin; 48819566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 488208401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4883273d9f13SBarry Smith 48844dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 48852205254eSKarl Rupp 4886b0a32e0cSBarry Smith B->data = (void *)b; 4887aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 4888071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 48892205254eSKarl Rupp 4890f4259b30SLisandro Dalcin b->row = NULL; 4891f4259b30SLisandro Dalcin b->col = NULL; 4892f4259b30SLisandro Dalcin b->icol = NULL; 4893b810aeb4SBarry Smith b->reallocs = 0; 489436db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4895f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4896416022c9SBarry Smith b->nonew = 0; 4897f4259b30SLisandro Dalcin b->diag = NULL; 4898f4259b30SLisandro Dalcin b->solve_work = NULL; 4899f4259b30SLisandro Dalcin B->spptr = NULL; 4900f4259b30SLisandro Dalcin b->saved_values = NULL; 4901f4259b30SLisandro Dalcin b->idiag = NULL; 4902f4259b30SLisandro Dalcin b->mdiag = NULL; 4903f4259b30SLisandro Dalcin b->ssor_work = NULL; 490471f1c65dSBarry Smith b->omega = 1.0; 490571f1c65dSBarry Smith b->fshift = 0.0; 490671f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4907bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4908a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 490917ab2063SBarry Smith 49109566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4911d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 49129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 49139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4914b3866ffcSBarry Smith #endif 49159566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 49169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 49179566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 49189566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 49199566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 49209566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 49219566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 49229779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 49239566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4924191b95cbSRichard Tran Mills #endif 492534b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 49269566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 49279566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49289566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 492902fe1965SBarry Smith #endif 4930d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4931d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 4932d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 4933d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ)); 4934d5e393b6SSuyash Tandon #endif 49353d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 49369566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 49373d0639e7SStefano Zampini #endif 49389566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4939af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 49409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4941af8000cdSHong Zhang #endif 4942d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 49439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4944d24d4204SJose E. Roman #endif 494563c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 49469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 49479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 494863c07aadSStefano Zampini #endif 49499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 49509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 49519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 49529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 495314e4dea2SJose E. Roman PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ)); 49549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 49559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 49569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 49579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 49589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 49599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 49609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 49629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 49639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 49649566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 49659566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 49669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 49673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 496817ab2063SBarry Smith } 496917ab2063SBarry Smith 4970b24902e0SBarry Smith /* 49713893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4972b24902e0SBarry Smith */ 4973d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4974d71ae5a4SJacob Faibussowitsch { 49752a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4976071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 497717ab2063SBarry Smith 49783a40ed3dSBarry Smith PetscFunctionBegin; 4979aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4980273d9f13SBarry Smith 4981d5f3da31SBarry Smith C->factortype = A->factortype; 4982f4259b30SLisandro Dalcin c->row = NULL; 4983f4259b30SLisandro Dalcin c->col = NULL; 4984f4259b30SLisandro Dalcin c->icol = NULL; 49856ad4291fSHong Zhang c->reallocs = 0; 4986bc43efbbSJunchao Zhang c->diagonaldense = a->diagonaldense; 498717ab2063SBarry Smith 498869272f91SPierre Jolivet C->assembled = A->assembled; 498917ab2063SBarry Smith 499069272f91SPierre Jolivet if (A->preallocated) { 49919566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 49929566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4993eec197d1SBarry Smith 499431fe6a7dSBarry Smith if (!A->hash_active) { 49959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 49969566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 49979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 49989566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 499917ab2063SBarry Smith 500017ab2063SBarry Smith /* allocate the matrix space */ 5001f77e22a1SHong Zhang if (mallocmatspace) { 50029566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 50032205254eSKarl Rupp 5004f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 50052205254eSKarl Rupp 50069566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 500717ab2063SBarry Smith if (m > 0) { 50089566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 5009be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 50102e5835c6SStefano Zampini const PetscScalar *aa; 50112e5835c6SStefano Zampini 50129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50139566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 50149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 5015be6bf707SBarry Smith } else { 50169566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 501717ab2063SBarry Smith } 501808480c60SBarry Smith } 5019f77e22a1SHong Zhang } 502031fe6a7dSBarry Smith C->preallocated = PETSC_TRUE; 502131fe6a7dSBarry Smith } else { 502231fe6a7dSBarry Smith PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix"); 502331fe6a7dSBarry Smith PetscCall(MatSetUp(C)); 502431fe6a7dSBarry Smith } 502517ab2063SBarry Smith 50266ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 5027416022c9SBarry Smith c->roworiented = a->roworiented; 5028416022c9SBarry Smith c->nonew = a->nonew; 5029416022c9SBarry Smith if (a->diag) { 50309566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 50319566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 5032071fcb05SBarry Smith } else c->diag = NULL; 50332205254eSKarl Rupp 5034f4259b30SLisandro Dalcin c->solve_work = NULL; 5035f4259b30SLisandro Dalcin c->saved_values = NULL; 5036f4259b30SLisandro Dalcin c->idiag = NULL; 5037f4259b30SLisandro Dalcin c->ssor_work = NULL; 5038a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 5039e6b907acSBarry Smith c->free_a = PETSC_TRUE; 5040e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 50416ad4291fSHong Zhang 5042893ad86cSHong Zhang c->rmax = a->rmax; 5043416022c9SBarry Smith c->nz = a->nz; 50448ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 5045754ec7b1SSatish Balay 50466ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 50476ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 5048cd6b891eSBarry Smith if (a->compressedrow.use) { 50496ad4291fSHong Zhang i = a->compressedrow.nrows; 50509566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 50519566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 50529566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 505327ea64f8SHong Zhang } else { 505427ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 50550298fd71SBarry Smith c->compressedrow.i = NULL; 50560298fd71SBarry Smith c->compressedrow.rindex = NULL; 50576ad4291fSHong Zhang } 5058ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 5059e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 50604846f1f5SKris Buschelman 50619566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 506269272f91SPierre Jolivet } 50639566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 50643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 506517ab2063SBarry Smith } 506617ab2063SBarry Smith 5067d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 5068d71ae5a4SJacob Faibussowitsch { 5069b24902e0SBarry Smith PetscFunctionBegin; 50709566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 50719566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 507248a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 50739566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 50749566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 50753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5076b24902e0SBarry Smith } 5077b24902e0SBarry Smith 5078d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 5079d71ae5a4SJacob Faibussowitsch { 508052f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 508152f91c60SVaclav Hapla 508252f91c60SVaclav Hapla PetscFunctionBegin; 508352f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 508452f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 5085c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 50869566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 50879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 50889566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 508952f91c60SVaclav Hapla if (isbinary) { 50909566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 509152f91c60SVaclav Hapla } else if (ishdf5) { 509252f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 50939566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 509452f91c60SVaclav Hapla #else 509552f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 509652f91c60SVaclav Hapla #endif 509752f91c60SVaclav Hapla } else { 509898921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 509952f91c60SVaclav Hapla } 51003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 510152f91c60SVaclav Hapla } 510252f91c60SVaclav Hapla 5103d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 5104d71ae5a4SJacob Faibussowitsch { 51053ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 51063ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 5107fbdbba38SShri Abhyankar 5108fbdbba38SShri Abhyankar PetscFunctionBegin; 51099566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5110bbead8a2SBarry Smith 51113ea6fe3dSLisandro Dalcin /* read in matrix header */ 51129566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 511308401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 51149371c9d4SSatish Balay M = header[1]; 51159371c9d4SSatish Balay N = header[2]; 51169371c9d4SSatish Balay nz = header[3]; 511708401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 511808401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 511908401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 5120fbdbba38SShri Abhyankar 51213ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 51229566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 51233ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 51243ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 51253ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 51263ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 51273ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 51289566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 51299566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 51303ea6fe3dSLisandro Dalcin 51313ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 51329566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5133aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51343ea6fe3dSLisandro Dalcin 5135fbdbba38SShri Abhyankar /* read in row lengths */ 51369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 51379566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 51383ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 51399371c9d4SSatish Balay sum = 0; 51409371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 514108401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 51423ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 51439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 51449566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5145aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51463ea6fe3dSLisandro Dalcin /* store row lengths */ 51479566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 51489566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5149fbdbba38SShri Abhyankar 51503ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 51519371c9d4SSatish Balay a->i[0] = 0; 51529371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 51533ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 51549566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 51553ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 51569566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5157fbdbba38SShri Abhyankar 51589566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 51599566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 51603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5161fbdbba38SShri Abhyankar } 5162fbdbba38SShri Abhyankar 5163d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5164d71ae5a4SJacob Faibussowitsch { 51657264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5166fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5167eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5168eeffb40dSHong Zhang PetscInt k; 5169eeffb40dSHong Zhang #endif 51707264ac53SSatish Balay 51713a40ed3dSBarry Smith PetscFunctionBegin; 5172bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5173d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5174ca44d042SBarry Smith *flg = PETSC_FALSE; 51753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5176bcd2baecSBarry Smith } 51777264ac53SSatish Balay 51787264ac53SSatish Balay /* if the a->i are the same */ 51799566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 51803ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 51817264ac53SSatish Balay 51827264ac53SSatish Balay /* if a->j are the same */ 51839566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 51843ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 5185bcd2baecSBarry Smith 51869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 51879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5188bcd2baecSBarry Smith /* if a->a are the same */ 5189eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5190eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5191fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5192eeffb40dSHong Zhang *flg = PETSC_FALSE; 51933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5194eeffb40dSHong Zhang } 5195eeffb40dSHong Zhang } 5196eeffb40dSHong Zhang #else 51979566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5198eeffb40dSHong Zhang #endif 51999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 52009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 52013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52027264ac53SSatish Balay } 520336db0b34SBarry Smith 520405869f15SSatish Balay /*@ 520511a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 520636db0b34SBarry Smith provided by the user. 520736db0b34SBarry Smith 5208d083f849SBarry Smith Collective 520936db0b34SBarry Smith 521036db0b34SBarry Smith Input Parameters: 521136db0b34SBarry Smith + comm - must be an MPI communicator of size 1 521236db0b34SBarry Smith . m - number of rows 521336db0b34SBarry Smith . n - number of columns 5214483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 521536db0b34SBarry Smith . j - column indices 521636db0b34SBarry Smith - a - matrix values 521736db0b34SBarry Smith 521836db0b34SBarry Smith Output Parameter: 521936db0b34SBarry Smith . mat - the matrix 522036db0b34SBarry Smith 522136db0b34SBarry Smith Level: intermediate 522236db0b34SBarry Smith 522336db0b34SBarry Smith Notes: 52242ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 5225292fb18eSBarry Smith once the matrix is destroyed and not before 522636db0b34SBarry Smith 522736db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 522836db0b34SBarry Smith 52292ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 523036db0b34SBarry Smith 5231a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5232a4552177SSatish Balay row-major ordering.. i.e for the following matrix, the input data expected is 52338eef79e4SBarry Smith as shown 52342ef1f0ffSBarry Smith .vb 52352ef1f0ffSBarry Smith 1 0 0 52362ef1f0ffSBarry Smith 2 0 3 52372ef1f0ffSBarry Smith 4 5 6 5238a4552177SSatish Balay 52392ef1f0ffSBarry Smith i = {0,1,3,6} [size = nrow+1 = 3+1] 52402ef1f0ffSBarry Smith j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 52412ef1f0ffSBarry Smith v = {1,2,3,4,5,6} [size = 6] 52422ef1f0ffSBarry Smith .ve 5243a4552177SSatish Balay 52441cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 524536db0b34SBarry Smith @*/ 5246d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5247d71ae5a4SJacob Faibussowitsch { 5248cbcfb4deSHong Zhang PetscInt ii; 524936db0b34SBarry Smith Mat_SeqAIJ *aij; 5250cbcfb4deSHong Zhang PetscInt jj; 525136db0b34SBarry Smith 525236db0b34SBarry Smith PetscFunctionBegin; 5253aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 52549566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52559566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52569566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 52579566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5259ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 52609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 52619566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5262ab93d7beSBarry Smith 526336db0b34SBarry Smith aij->i = i; 526436db0b34SBarry Smith aij->j = j; 526536db0b34SBarry Smith aij->a = a; 526636db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 526736db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5268e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5269e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 527036db0b34SBarry Smith 5271cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 527236db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 527376bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5274aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 52759985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 527608401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 527708401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 52789985e31cSBarry Smith } 527936db0b34SBarry Smith } 528076bd3646SJed Brown } 528176bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 528236db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 528308401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5284da0802e2SStefano Zampini PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1); 528536db0b34SBarry Smith } 528676bd3646SJed Brown } 528736db0b34SBarry Smith 52889566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52899566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 529136db0b34SBarry Smith } 5292cbc6b225SStefano Zampini 5293f62e3866SBarry Smith /*@ 529411a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 52958a0b0e6bSVictor Minden provided by the user. 52968a0b0e6bSVictor Minden 5297d083f849SBarry Smith Collective 52988a0b0e6bSVictor Minden 52998a0b0e6bSVictor Minden Input Parameters: 53008a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 53018a0b0e6bSVictor Minden . m - number of rows 53028a0b0e6bSVictor Minden . n - number of columns 53038a0b0e6bSVictor Minden . i - row indices 53048a0b0e6bSVictor Minden . j - column indices 53051230e6d1SVictor Minden . a - matrix values 53061230e6d1SVictor Minden . nz - number of nonzeros 53072ef1f0ffSBarry Smith - idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 53088a0b0e6bSVictor Minden 53098a0b0e6bSVictor Minden Output Parameter: 53108a0b0e6bSVictor Minden . mat - the matrix 53118a0b0e6bSVictor Minden 53128a0b0e6bSVictor Minden Level: intermediate 53138a0b0e6bSVictor Minden 5314f62e3866SBarry Smith Example: 5315f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 53169e99939fSJunchao Zhang .vb 53178a0b0e6bSVictor Minden 1 0 0 53188a0b0e6bSVictor Minden 2 0 3 53198a0b0e6bSVictor Minden 4 5 6 53208a0b0e6bSVictor Minden 53218a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 53228a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 53238a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 53249e99939fSJunchao Zhang .ve 5325fe59aa6dSJacob Faibussowitsch 53262ef1f0ffSBarry Smith Note: 5327d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5328d7547e51SJunchao Zhang and are particularly useful in iterative applications. 53298a0b0e6bSVictor Minden 53301cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 53318a0b0e6bSVictor Minden @*/ 5332d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5333d71ae5a4SJacob Faibussowitsch { 5334d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 53358a0b0e6bSVictor Minden 53368a0b0e6bSVictor Minden PetscFunctionBegin; 53379566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5338ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 53399566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 53409566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 53419566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 53429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 53431230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 53441230e6d1SVictor Minden if (idx) { 53451230e6d1SVictor Minden row = i[ii] - 1; 53461230e6d1SVictor Minden col = j[ii] - 1; 53471230e6d1SVictor Minden } else { 53481230e6d1SVictor Minden row = i[ii]; 53491230e6d1SVictor Minden col = j[ii]; 53508a0b0e6bSVictor Minden } 53519566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 53528a0b0e6bSVictor Minden } 53539566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 53549566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 53559566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 53563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53578a0b0e6bSVictor Minden } 535836db0b34SBarry Smith 5359d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5360d71ae5a4SJacob Faibussowitsch { 5361acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5362acf2f550SJed Brown 5363acf2f550SJed Brown PetscFunctionBegin; 5364acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5365acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 53662205254eSKarl Rupp 53679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 53683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5369acf2f550SJed Brown } 5370acf2f550SJed Brown 5371d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5372d71ae5a4SJacob Faibussowitsch { 53739c8f2541SHong Zhang PetscFunctionBegin; 53749566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 53753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53769c8f2541SHong Zhang } 53779c8f2541SHong Zhang 537881824310SBarry Smith /* 537953dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 538053dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 538153dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 538253dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 538353dd7562SDmitry Karpeev */ 5384d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5385d71ae5a4SJacob Faibussowitsch { 538653dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 538753dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 538853dd7562SDmitry Karpeev PetscBool seqaij; 538953dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 539053dd7562SDmitry Karpeev PetscScalar v; 539153dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 539253dd7562SDmitry Karpeev 539353dd7562SDmitry Karpeev PetscFunctionBegin; 53943ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 539553dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */ 53969566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 539728b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 539853dd7562SDmitry Karpeev if (rowemb) { 53999566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 540008401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 540153dd7562SDmitry Karpeev } else { 540208401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 540353dd7562SDmitry Karpeev } 540453dd7562SDmitry Karpeev if (colemb) { 54059566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 540608401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 540753dd7562SDmitry Karpeev } else { 540808401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 540953dd7562SDmitry Karpeev } 541053dd7562SDmitry Karpeev 5411f4f49eeaSPierre Jolivet Baij = (Mat_SeqAIJ *)B->data; 541253dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 54139566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5414ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 54159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 54169566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 541753dd7562SDmitry Karpeev } 541848a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 541953dd7562SDmitry Karpeev count = 0; 542053dd7562SDmitry Karpeev rowindices = NULL; 542153dd7562SDmitry Karpeev colindices = NULL; 542248a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 542348a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 542453dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 542553dd7562SDmitry Karpeev PetscInt row; 542653dd7562SDmitry Karpeev row = i; 542753dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 542853dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 542953dd7562SDmitry Karpeev PetscInt col; 543053dd7562SDmitry Karpeev col = Baij->j[count]; 543153dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 543253dd7562SDmitry Karpeev v = Baij->a[count]; 54339566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 543453dd7562SDmitry Karpeev ++count; 543553dd7562SDmitry Karpeev } 543653dd7562SDmitry Karpeev } 543753dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 543853dd7562SDmitry Karpeev /* Assembly for C is necessary. */ 543953dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 544053dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 544153dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 54423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 544353dd7562SDmitry Karpeev } 544453dd7562SDmitry Karpeev 544558c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep) 5446dec0b466SHong Zhang { 5447dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5448dec0b466SHong Zhang MatScalar *aa = a->a; 5449dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5450dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5451dec0b466SHong Zhang 5452dec0b466SHong Zhang PetscFunctionBegin; 5453dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5454dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5455dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5456dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5457dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 545858c11ad4SPierre Jolivet if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++; 5459dec0b466SHong Zhang else { 5460dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5461dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5462dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5463dec0b466SHong Zhang } 5464dec0b466SHong Zhang } 5465dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5466dec0b466SHong Zhang fshift_prev = fshift; 5467dec0b466SHong Zhang /* reset ilen and imax for each row */ 5468dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5469dec0b466SHong Zhang a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0); 5470dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5471dec0b466SHong Zhang } 5472312eded4SPierre Jolivet if (fshift) { 5473dec0b466SHong Zhang if (m) { 5474dec0b466SHong Zhang ai[m] -= fshift; 5475dec0b466SHong Zhang a->nz = ai[m]; 5476dec0b466SHong Zhang } 5477dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5478312eded4SPierre Jolivet A->nonzerostate++; 5479dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5480dec0b466SHong Zhang a->rmax = rmax; 5481dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5482dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5483dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5484312eded4SPierre Jolivet } 54853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5486dec0b466SHong Zhang } 5487dec0b466SHong Zhang 54884099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 54894099cc6bSBarry Smith 5490cc4c1da9SBarry Smith /*@ 549111a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 54924099cc6bSBarry Smith 5493c3339decSBarry Smith Collective 54944099cc6bSBarry Smith 54954099cc6bSBarry Smith Input Parameters: 54964099cc6bSBarry Smith + mat - the matrix object 54974099cc6bSBarry Smith - matype - matrix type 54984099cc6bSBarry Smith 54994099cc6bSBarry Smith Options Database Key: 55004e187271SRichard Tran Mills . -mat_seqaij_type <method> - for example seqaijcrl 55014099cc6bSBarry Smith 55024099cc6bSBarry Smith Level: intermediate 55034099cc6bSBarry Smith 5504fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType` 55054099cc6bSBarry Smith @*/ 5506d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5507d71ae5a4SJacob Faibussowitsch { 55084099cc6bSBarry Smith PetscBool sametype; 55095f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 55104099cc6bSBarry Smith 55114099cc6bSBarry Smith PetscFunctionBegin; 55124099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 55139566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 55143ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 55154099cc6bSBarry Smith 55169566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 55176adde796SStefano Zampini PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 55189566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 55193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55204099cc6bSBarry Smith } 55214099cc6bSBarry Smith 55224099cc6bSBarry Smith /*@C 552311a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 55244099cc6bSBarry Smith 5525cc4c1da9SBarry Smith Not Collective, No Fortran Support 55264099cc6bSBarry Smith 55274099cc6bSBarry Smith Input Parameters: 5528fe59aa6dSJacob Faibussowitsch + sname - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 55294099cc6bSBarry Smith - function - routine to convert to subtype 55304099cc6bSBarry Smith 55312ef1f0ffSBarry Smith Level: advanced 55322ef1f0ffSBarry Smith 55334099cc6bSBarry Smith Notes: 553411a5261eSBarry Smith `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 55354099cc6bSBarry Smith 55364099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 55374099cc6bSBarry Smith $ -mat_seqaij_type my_mat 55384099cc6bSBarry Smith 55391cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()` 55404099cc6bSBarry Smith @*/ 5541d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5542d71ae5a4SJacob Faibussowitsch { 55434099cc6bSBarry Smith PetscFunctionBegin; 55449566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 55459566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 55463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55474099cc6bSBarry Smith } 55484099cc6bSBarry Smith 55494099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 55504099cc6bSBarry Smith 55514099cc6bSBarry Smith /*@C 555211a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 55534099cc6bSBarry Smith 55544099cc6bSBarry Smith Not Collective 55554099cc6bSBarry Smith 55564099cc6bSBarry Smith Level: advanced 55574099cc6bSBarry Smith 55582ef1f0ffSBarry Smith Note: 55592ef1f0ffSBarry Smith This registers the versions of `MATSEQAIJ` for GPUs 55602ef1f0ffSBarry Smith 55611cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()` 55624099cc6bSBarry Smith @*/ 5563d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5564d71ae5a4SJacob Faibussowitsch { 55654099cc6bSBarry Smith PetscFunctionBegin; 55663ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 55674099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 55684099cc6bSBarry Smith 55699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 55709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 55719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 55729779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 55739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5574485f9817SRichard Tran Mills #endif 55755063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 55769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 55775063d097SStefano Zampini #endif 5578d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5579d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5580d5e393b6SSuyash Tandon #endif 55815063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 55829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 55835063d097SStefano Zampini #endif 55844099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 55859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 55864099cc6bSBarry Smith #endif 55873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55884099cc6bSBarry Smith } 558953dd7562SDmitry Karpeev 559053dd7562SDmitry Karpeev /* 559181824310SBarry Smith Special version for direct calls from Fortran 559281824310SBarry Smith */ 559381824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 559481824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 559581824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 559681824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 559781824310SBarry Smith #endif 559881824310SBarry Smith 559981824310SBarry Smith /* Change these macros so can be used in void function */ 560098921bdaSJacob Faibussowitsch 560198921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 56029566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 56039566063dSJacob Faibussowitsch #undef PetscCall 56049371c9d4SSatish Balay #define PetscCall(...) \ 56059371c9d4SSatish Balay do { \ 56065f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 560798921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 560898921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 560998921bdaSJacob Faibussowitsch return; \ 561098921bdaSJacob Faibussowitsch } \ 561198921bdaSJacob Faibussowitsch } while (0) 561298921bdaSJacob Faibussowitsch 561398921bdaSJacob Faibussowitsch #undef SETERRQ 56149371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 56159371c9d4SSatish Balay do { \ 561698921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 561798921bdaSJacob Faibussowitsch return; \ 561898921bdaSJacob Faibussowitsch } while (0) 561981824310SBarry Smith 5620d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5621d71ae5a4SJacob Faibussowitsch { 562281824310SBarry Smith Mat A = *AA; 562381824310SBarry Smith PetscInt m = *mm, n = *nn; 562481824310SBarry Smith InsertMode is = *isis; 562581824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 562681824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 562781824310SBarry Smith PetscInt *imax, *ai, *ailen; 562881824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 562954f21887SBarry Smith MatScalar *ap, value, *aa; 5630ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5631ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 563281824310SBarry Smith 563381824310SBarry Smith PetscFunctionBegin; 56344994cf47SJed Brown MatCheckPreallocated(A, 1); 563581824310SBarry Smith imax = a->imax; 563681824310SBarry Smith ai = a->i; 563781824310SBarry Smith ailen = a->ilen; 563881824310SBarry Smith aj = a->j; 563981824310SBarry Smith aa = a->a; 564081824310SBarry Smith 564181824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 564281824310SBarry Smith row = im[k]; 564381824310SBarry Smith if (row < 0) continue; 56445f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 56459371c9d4SSatish Balay rp = aj + ai[row]; 56469371c9d4SSatish Balay ap = aa + ai[row]; 56479371c9d4SSatish Balay rmax = imax[row]; 56489371c9d4SSatish Balay nrow = ailen[row]; 564981824310SBarry Smith low = 0; 565081824310SBarry Smith high = nrow; 565181824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 565281824310SBarry Smith if (in[l] < 0) continue; 56535f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 565481824310SBarry Smith col = in[l]; 56552205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 56562205254eSKarl Rupp else value = v[k + l * m]; 56572205254eSKarl Rupp 565881824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 565981824310SBarry Smith 56602205254eSKarl Rupp if (col <= lastcol) low = 0; 56612205254eSKarl Rupp else high = nrow; 566281824310SBarry Smith lastcol = col; 566381824310SBarry Smith while (high - low > 5) { 566481824310SBarry Smith t = (low + high) / 2; 566581824310SBarry Smith if (rp[t] > col) high = t; 566681824310SBarry Smith else low = t; 566781824310SBarry Smith } 566881824310SBarry Smith for (i = low; i < high; i++) { 566981824310SBarry Smith if (rp[i] > col) break; 567081824310SBarry Smith if (rp[i] == col) { 567181824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 567281824310SBarry Smith else ap[i] = value; 567381824310SBarry Smith goto noinsert; 567481824310SBarry Smith } 567581824310SBarry Smith } 567681824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 567781824310SBarry Smith if (nonew == 1) goto noinsert; 56785f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5679fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 56809371c9d4SSatish Balay N = nrow++ - 1; 56819371c9d4SSatish Balay a->nz++; 56829371c9d4SSatish Balay high++; 568381824310SBarry Smith /* shift up all the later entries in this row */ 568481824310SBarry Smith for (ii = N; ii >= i; ii--) { 568581824310SBarry Smith rp[ii + 1] = rp[ii]; 568681824310SBarry Smith ap[ii + 1] = ap[ii]; 568781824310SBarry Smith } 568881824310SBarry Smith rp[i] = col; 568981824310SBarry Smith ap[i] = value; 569081824310SBarry Smith noinsert:; 569181824310SBarry Smith low = i + 1; 569281824310SBarry Smith } 569381824310SBarry Smith ailen[row] = nrow; 569481824310SBarry Smith } 569581824310SBarry Smith PetscFunctionReturnVoid(); 569681824310SBarry Smith } 569798921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 569898921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 569998921bdaSJacob Faibussowitsch * original definitions */ 57009566063dSJacob Faibussowitsch #undef PetscCall 570198921bdaSJacob Faibussowitsch #undef SETERRQ 5702