1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 20d71ae5a4SJacob Faibussowitsch { 214099cc6bSBarry Smith PetscBool flg; 224099cc6bSBarry Smith char type[256]; 234099cc6bSBarry Smith 244099cc6bSBarry Smith PetscFunctionBegin; 25d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 279566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 28d0609cedSBarry Smith PetscOptionsEnd(); 293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 304099cc6bSBarry Smith } 314099cc6bSBarry Smith 32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 33d71ae5a4SJacob Faibussowitsch { 340716a85fSBarry Smith PetscInt i, m, n; 350716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 360716a85fSBarry Smith 370716a85fSBarry Smith PetscFunctionBegin; 389566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 400716a85fSBarry Smith if (type == NORM_2) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 420716a85fSBarry Smith } else if (type == NORM_1) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_INFINITY) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 506adde796SStefano Zampini } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 53a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 54857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 560716a85fSBarry Smith } 573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 580716a85fSBarry Smith } 590716a85fSBarry Smith 60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 61d71ae5a4SJacob Faibussowitsch { 623a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 633a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 
643a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 653a062f41SBarry Smith PetscInt *rows; 663a062f41SBarry Smith 673a062f41SBarry Smith PetscFunctionBegin; 683a062f41SBarry Smith for (i = 0; i < m; i++) { 69ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i = 0; i < m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 799566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 84d71ae5a4SJacob Faibussowitsch { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 86fff043a9SJunchao Zhang const MatScalar *aa; 876ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith 916ce1633cSBarry Smith PetscFunctionBegin; 929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 939566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i = 0; i < m; i++) { 96ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 976ce1633cSBarry Smith } 989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 996ce1633cSBarry Smith cnt = 0; 1006ce1633cSBarry 
Smith for (i = 0; i < m; i++) { 101ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1026ce1633cSBarry Smith } 103f1f41ecbSJed Brown *nrows = cnt; 104f1f41ecbSJed Brown *zrows = rows; 1059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107f1f41ecbSJed Brown } 108f1f41ecbSJed Brown 109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 110d71ae5a4SJacob Faibussowitsch { 111f1f41ecbSJed Brown PetscInt nrows, *rows; 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscFunctionBegin; 1140298fd71SBarry Smith *zrows = NULL; 1159566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1169566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1186ce1633cSBarry Smith } 1196ce1633cSBarry Smith 120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 121d71ae5a4SJacob Faibussowitsch { 122b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 123b3a44c85SBarry Smith const MatScalar *aa; 124b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 125b3a44c85SBarry Smith const PetscInt *ii; 126b3a44c85SBarry Smith PetscInt n, i, j, *rows; 127b3a44c85SBarry Smith 128b3a44c85SBarry Smith PetscFunctionBegin; 1299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 130f4259b30SLisandro Dalcin *keptrows = NULL; 131b3a44c85SBarry Smith ii = a->i; 132b3a44c85SBarry Smith for (i = 0; i < m; i++) { 133b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 134b3a44c85SBarry Smith if (!n) { 135b3a44c85SBarry Smith cnt++; 136b3a44c85SBarry Smith goto ok1; 137b3a44c85SBarry Smith } 1382e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 
139b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 140b3a44c85SBarry Smith } 141b3a44c85SBarry Smith cnt++; 142b3a44c85SBarry Smith ok1:; 143b3a44c85SBarry Smith } 1442e5835c6SStefano Zampini if (!cnt) { 1459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1472e5835c6SStefano Zampini } 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 149b3a44c85SBarry Smith cnt = 0; 150b3a44c85SBarry Smith for (i = 0; i < m; i++) { 151b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 152b3a44c85SBarry Smith if (!n) continue; 1532e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 154b3a44c85SBarry Smith if (aa[j] != 0.0) { 155b3a44c85SBarry Smith rows[cnt++] = i; 156b3a44c85SBarry Smith break; 157b3a44c85SBarry Smith } 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 1609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1619566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith 165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 166d71ae5a4SJacob Faibussowitsch { 16779299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172ace3abfcSBarry Smith PetscBool missing; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 1769566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 17709f38230SBarry Smith if (!missing) { 17879299369SBarry Smith diag = aij->diag; 1799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 
1809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 18179299369SBarry Smith if (is == INSERT_VALUES) { 182ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18379299369SBarry Smith } else { 184ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18579299369SBarry Smith } 1869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18979299369SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 19109f38230SBarry Smith } 1929566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19409f38230SBarry Smith } 19579299369SBarry Smith 196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 197d71ae5a4SJacob Faibussowitsch { 198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19997f1f81fSBarry Smith PetscInt i, ishift; 20017ab2063SBarry Smith 2013a40ed3dSBarry Smith PetscFunctionBegin; 202f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2033ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 204bfeeae90SHong Zhang ishift = 0; 205b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2069566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 207bfeeae90SHong Zhang } else if (oshift == 1) { 2081a83f524SJed Brown PetscInt *tia; 209d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2103b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 
2121a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2131a83f524SJed Brown *ia = tia; 214ecc77c7aSBarry Smith if (ja) { 2151a83f524SJed Brown PetscInt *tja; 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob 
Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch 
PetscCall(PetscFree(*ja)); 2813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; 
row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 
379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, 
PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 4188e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 4198e3a54c0SPierre Jolivet if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]); 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != 
col) goto noinsert; 453c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e44c0bd4SBarry Smith noinsert:; 47217ab2063SBarry Smith } 47317ab2063SBarry Smith ailen[row] = nrow; 47417ab2063SBarry Smith } 4759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47717ab2063SBarry Smith } 47817ab2063SBarry Smith 479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 480d71ae5a4SJacob Faibussowitsch { 48119b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48219b08ed1SBarry Smith PetscInt *rp, k, row; 48319b08ed1SBarry Smith PetscInt *ai = a->i; 48419b08ed1SBarry Smith PetscInt *aj = a->j; 485fff043a9SJunchao Zhang 
MatScalar *aa, *ap; 48619b08ed1SBarry Smith 48719b08ed1SBarry Smith PetscFunctionBegin; 48828b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48908401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 490fff043a9SJunchao Zhang 4919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49219b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49319b08ed1SBarry Smith row = im[k]; 49419b08ed1SBarry Smith rp = aj + ai[row]; 4958e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 49619b08ed1SBarry Smith 4979566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49819b08ed1SBarry Smith if (!A->structure_only) { 49919b08ed1SBarry Smith if (v) { 5009566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 50119b08ed1SBarry Smith v += n; 50219b08ed1SBarry Smith } else { 5039566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50419b08ed1SBarry Smith } 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith a->ilen[row] = n; 50719b08ed1SBarry Smith a->imax[row] = n; 50819b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50919b08ed1SBarry Smith a->nz += n; 51019b08ed1SBarry Smith } 5119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51319b08ed1SBarry Smith } 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith /*@ 51619b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 
51719b08ed1SBarry Smith 51819b08ed1SBarry Smith Input Parameters: 51911a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52119b08ed1SBarry Smith 52219b08ed1SBarry Smith Level: advanced 52319b08ed1SBarry Smith 52419b08ed1SBarry Smith Notes: 52519b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52611a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52719b08ed1SBarry Smith as always with multiple matrix assemblies. 52819b08ed1SBarry Smith 5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53019b08ed1SBarry Smith @*/ 531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 532d71ae5a4SJacob Faibussowitsch { 53319b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53419b08ed1SBarry Smith 53519b08ed1SBarry Smith PetscFunctionBegin; 5369566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53819b08ed1SBarry Smith a->maxnz = nztotal; 5394dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 54019b08ed1SBarry Smith if (!a->ilen) { 5419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54219b08ed1SBarry Smith } else { 5439566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54419b08ed1SBarry Smith } 54519b08ed1SBarry Smith 54619b08ed1SBarry Smith /* allocate the matrix space */ 5479f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(A->rmap->n + 1, sizeof(PetscInt), (void **)&a->i)); 5489f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscInt), (void **)&a->j)); 
5499f0612e4SBarry Smith a->free_ij = PETSC_TRUE; 55019b08ed1SBarry Smith if (A->structure_only) { 55119b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55219b08ed1SBarry Smith } else { 5539f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscScalar), (void **)&a->a)); 55419b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55519b08ed1SBarry Smith } 5569f0612e4SBarry Smith a->i[0] = 0; 55719b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55819b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56019b08ed1SBarry Smith } 56119b08ed1SBarry Smith 562ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 563d71ae5a4SJacob Faibussowitsch { 564071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 565071fcb05SBarry Smith PetscInt *rp, k, row; 566071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 567071fcb05SBarry Smith PetscInt *aj = a->j; 568fff043a9SJunchao Zhang MatScalar *aa, *ap; 569071fcb05SBarry Smith 570071fcb05SBarry Smith PetscFunctionBegin; 5719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 572071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 573071fcb05SBarry Smith row = im[k]; 5746bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 575071fcb05SBarry Smith rp = aj + ai[row]; 576071fcb05SBarry Smith ap = aa + ai[row]; 57748a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 578071fcb05SBarry Smith if (!A->structure_only) { 579071fcb05SBarry Smith if (v) { 5809566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 581071fcb05SBarry Smith v += n; 
582071fcb05SBarry Smith } else { 5839566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 584071fcb05SBarry Smith } 585071fcb05SBarry Smith } 586071fcb05SBarry Smith ailen[row] = n; 587071fcb05SBarry Smith a->nz += n; 588071fcb05SBarry Smith } 5899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 591071fcb05SBarry Smith } 592071fcb05SBarry Smith 593ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 594d71ae5a4SJacob Faibussowitsch { 5957eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59697f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59797f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 5984e208921SJed Brown const MatScalar *ap, *aa; 5997eb43aa7SLois Curfman McInnes 6003a40ed3dSBarry Smith PetscFunctionBegin; 6014e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6027eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6037eb43aa7SLois Curfman McInnes row = im[k]; 6049371c9d4SSatish Balay if (row < 0) { 6059371c9d4SSatish Balay v += n; 6069371c9d4SSatish Balay continue; 6079371c9d4SSatish Balay } /* negative row */ 60854c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6098e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 6108e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 6117eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6127eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6139371c9d4SSatish Balay if (in[l] < 0) { 6149371c9d4SSatish Balay v++; 6159371c9d4SSatish Balay continue; 6169371c9d4SSatish Balay } /* negative column */ 
61754c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 618bfeeae90SHong Zhang col = in[l]; 6199371c9d4SSatish Balay high = nrow; 6209371c9d4SSatish Balay low = 0; /* assume unsorted */ 6217eb43aa7SLois Curfman McInnes while (high - low > 5) { 6227eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6237eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6247eb43aa7SLois Curfman McInnes else low = t; 6257eb43aa7SLois Curfman McInnes } 6267eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6277eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6287eb43aa7SLois Curfman McInnes if (rp[i] == col) { 629b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6307eb43aa7SLois Curfman McInnes goto finished; 6317eb43aa7SLois Curfman McInnes } 6327eb43aa7SLois Curfman McInnes } 63397e567efSBarry Smith *v++ = 0.0; 6347eb43aa7SLois Curfman McInnes finished:; 6357eb43aa7SLois Curfman McInnes } 6367eb43aa7SLois Curfman McInnes } 6374e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6397eb43aa7SLois Curfman McInnes } 6407eb43aa7SLois Curfman McInnes 641ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 642d71ae5a4SJacob Faibussowitsch { 6433ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 644c898d852SStefano Zampini const PetscScalar *av; 6453ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6463ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64717ab2063SBarry Smith 6483a40ed3dSBarry Smith PetscFunctionBegin; 6499566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6502205254eSKarl Rupp 6513ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6523ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6533ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6543ea6fe3dSLisandro Dalcin nz = A->nz; 655416022c9SBarry 
Smith 6563ea6fe3dSLisandro Dalcin /* write matrix header */ 6573ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6589371c9d4SSatish Balay header[1] = M; 6599371c9d4SSatish Balay header[2] = N; 6609371c9d4SSatish Balay header[3] = nz; 6619566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 662416022c9SBarry Smith 6633ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6653ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6669566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6679566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6683ea6fe3dSLisandro Dalcin /* store column indices */ 6699566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 670416022c9SBarry Smith /* store nonzero values */ 6719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6729566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 674b37d52dbSMark F. 
Adams 6753ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6769566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 67817ab2063SBarry Smith } 679416022c9SBarry Smith 680d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 681d71ae5a4SJacob Faibussowitsch { 6827dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6837dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6847dc0baabSHong Zhang 6857dc0baabSHong Zhang PetscFunctionBegin; 6869566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6877dc0baabSHong Zhang for (i = 0; i < m; i++) { 6889566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 68948a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6909566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6917dc0baabSHong Zhang } 6929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6947dc0baabSHong Zhang } 6957dc0baabSHong Zhang 69609573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 697cd155464SBarry Smith 698ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 699d71ae5a4SJacob Faibussowitsch { 700416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 701c898d852SStefano Zampini const PetscScalar *av; 70260e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 703e060cb09SBarry Smith const char *name; 704f3ef73ceSBarry Smith PetscViewerFormat format; 70517ab2063SBarry Smith 7063a40ed3dSBarry Smith PetscFunctionBegin; 7077dc0baabSHong Zhang if (A->structure_only) { 7089566063dSJacob Faibussowitsch 
PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7107dc0baabSHong Zhang } 71143e49210SHong Zhang 7129566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 713bd6a2ce3SJunchao Zhang // By petsc's rule, even PETSC_VIEWER_ASCII_INFO_DETAIL doesn't print matrix entries 7143ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 7152e5835c6SStefano Zampini 716c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 71971c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 72097f1f81fSBarry Smith PetscInt nofinalvalue = 0; 72160e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 722c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 723d00d2cf4SBarry Smith nofinalvalue = 1; 724d00d2cf4SBarry Smith } 7259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 728fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 730fbfe6fa7SJed Brown #else 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 732fbfe6fa7SJed Brown #endif 7339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73417ab2063SBarry Smith 73517ab2063SBarry Smith for (i = 0; i < m; i++) { 73660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 737aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 73917ab2063SBarry Smith #else 7409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 74117ab2063SBarry Smith #endif 74217ab2063SBarry Smith } 74317ab2063SBarry Smith } 744d00d2cf4SBarry Smith if (nofinalvalue) { 745c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 747c337ccceSJed Brown #else 7489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 749c337ccceSJed Brown #endif 750d00d2cf4SBarry Smith } 7519566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 754fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 75644cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 75860e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 759aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76036db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76236db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76436db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7666831982aSBarry Smith } 76744cd7ae7SLois Curfman McInnes #else 7689566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 76944cd7ae7SLois Curfman McInnes #endif 77044cd7ae7SLois Curfman McInnes } 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77244cd7ae7SLois 
Curfman McInnes } 7739566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 774fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 77597f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7779566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 778496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 779496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 78060e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 781496be53dSLois Curfman McInnes if (a->j[j] >= i) { 782aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 784496be53dSLois Curfman McInnes #else 785496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 786496be53dSLois Curfman McInnes #endif 787496be53dSLois Curfman McInnes } 788496be53dSLois Curfman McInnes } 789496be53dSLois Curfman McInnes } 7902e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7922e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7932205254eSKarl Rupp if (i + 4 < m) { 7949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 7952205254eSKarl Rupp } else if (i + 3 < m) { 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 7972205254eSKarl Rupp } else if (i + 2 < m) { 7989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 7992205254eSKarl Rupp } else if (i + 1 < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 8012205254eSKarl Rupp } else if (i < m) { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8032205254eSKarl Rupp } else { 8049566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8052205254eSKarl Rupp } 806496be53dSLois Curfman McInnes } 8079566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8089566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 809496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81060e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8119566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 812496be53dSLois Curfman McInnes } 8139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 814496be53dSLois Curfman McInnes } 8159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 816496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81760e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 818496be53dSLois Curfman McInnes if (a->j[j] >= i) { 819aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 82048a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 821496be53dSLois Curfman McInnes #else 8229566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
823496be53dSLois Curfman McInnes #endif 824496be53dSLois Curfman McInnes } 825496be53dSLois Curfman McInnes } 8269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 827496be53dSLois Curfman McInnes } 8289566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 829fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 83097f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 83187828ca2SBarry Smith PetscScalar value; 83268f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83368f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83468f1ed48SBarry Smith 83568f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 83668f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 83768f1ed48SBarry Smith realonly = PETSC_FALSE; 83868f1ed48SBarry Smith break; 83968f1ed48SBarry Smith } 84068f1ed48SBarry Smith } 84168f1ed48SBarry Smith #endif 84202594712SBarry Smith 8439566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84402594712SBarry Smith for (i = 0; i < m; i++) { 84502594712SBarry Smith jcnt = 0; 846d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 847e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 84802594712SBarry Smith value = a->a[cnt++]; 849e24b481bSBarry Smith jcnt++; 85002594712SBarry Smith } else { 85102594712SBarry Smith value = 0.0; 85202594712SBarry Smith } 853aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85468f1ed48SBarry Smith if (realonly) { 8559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 85668f1ed48SBarry Smith } else { 8579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 85868f1ed48SBarry Smith } 85902594712SBarry Smith #else 8609566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 86102594712SBarry Smith 
#endif 86202594712SBarry Smith } 8639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86402594712SBarry Smith } 8659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8663c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 867150b93efSMatthew G. Knepley PetscInt fshift = 1; 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8693c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8713c215bfdSMatthew Knepley #else 8729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8733c215bfdSMatthew Knepley #endif 8749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8753c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 87660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8773c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8793c215bfdSMatthew Knepley #else 8809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8813c215bfdSMatthew Knepley #endif 8823c215bfdSMatthew Knepley } 8833c215bfdSMatthew Knepley } 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8853a40ed3dSBarry Smith } else { 8869566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 887d5f3da31SBarry Smith if (A->factortype) { 88816cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 89016cd7e1dSShri Abhyankar /* L part */ 89160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89316cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 89516cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 89716cd7e1dSShri Abhyankar } else { 8989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 89916cd7e1dSShri Abhyankar } 90016cd7e1dSShri Abhyankar #else 9019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90216cd7e1dSShri Abhyankar #endif 90316cd7e1dSShri Abhyankar } 90416cd7e1dSShri Abhyankar /* diagonal */ 90516cd7e1dSShri Abhyankar j = a->diag[i]; 90616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 90716cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 90916cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 91116cd7e1dSShri Abhyankar } else { 9129566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91316cd7e1dSShri Abhyankar } 91416cd7e1dSShri Abhyankar #else 9159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 91616cd7e1dSShri Abhyankar #endif 91716cd7e1dSShri Abhyankar 91816cd7e1dSShri Abhyankar /* U part */ 91960e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 92016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 92116cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92316cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 92516cd7e1dSShri Abhyankar } else { 9269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 92716cd7e1dSShri Abhyankar } 92816cd7e1dSShri Abhyankar #else 9299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 93016cd7e1dSShri Abhyankar #endif 93116cd7e1dSShri Abhyankar } 9329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93316cd7e1dSShri Abhyankar } 93416cd7e1dSShri Abhyankar } else { 93517ab2063SBarry Smith for (i = 0; i < m; i++) { 9369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 93760e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 938aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 93936db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94136db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9433a40ed3dSBarry Smith } else { 9449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 94517ab2063SBarry Smith } 94617ab2063SBarry Smith #else 9479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 94817ab2063SBarry Smith #endif 94917ab2063SBarry Smith } 9509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95117ab2063SBarry Smith } 95216cd7e1dSShri Abhyankar } 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95417ab2063SBarry Smith } 9559566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 957416022c9SBarry Smith } 958416022c9SBarry Smith 9599804daf3SBarry Smith #include <petscdraw.h> 960ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 961d71ae5a4SJacob Faibussowitsch { 962480ef9eaSBarry Smith Mat A = (Mat)Aa; 963416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 964383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 965383922c3SLisandro Dalcin int color; 966b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 967b0a32e0cSBarry Smith PetscViewer viewer; 968f3ef73ceSBarry Smith PetscViewerFormat format; 969fff043a9SJunchao Zhang const PetscScalar *aa; 970cddf8d76SBarry Smith 
9713a40ed3dSBarry Smith PetscFunctionBegin; 9729566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9739566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9749566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 975383922c3SLisandro Dalcin 976416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 978fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 979d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9800513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 981b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 982416022c9SBarry Smith for (i = 0; i < m; i++) { 9839371c9d4SSatish Balay y_l = m - i - 1.0; 9849371c9d4SSatish Balay y_r = y_l + 1.0; 985bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9869371c9d4SSatish Balay x_l = a->j[j]; 9879371c9d4SSatish Balay x_r = x_l + 1.0; 988fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9899566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 990cddf8d76SBarry Smith } 991cddf8d76SBarry Smith } 992b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 993cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9949371c9d4SSatish Balay y_l = m - i - 1.0; 9959371c9d4SSatish Balay y_r = y_l + 1.0; 996bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9979371c9d4SSatish Balay x_l = a->j[j]; 9989371c9d4SSatish Balay x_r = x_l + 1.0; 999fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 10009566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1001cddf8d76SBarry Smith } 1002cddf8d76SBarry Smith } 1003b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1004cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10059371c9d4SSatish Balay y_l = m - i - 1.0; 10069371c9d4SSatish Balay y_r = y_l + 1.0; 1007bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10089371c9d4SSatish Balay x_l = a->j[j]; 10099371c9d4SSatish Balay x_r = x_l + 1.0; 1010fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10119566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1012416022c9SBarry Smith } 1013416022c9SBarry Smith } 1014d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10150513a670SBarry Smith } else { 10160513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10170513a670SBarry Smith /* first determine max of all nonzero values */ 1018b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1019383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1020b0a32e0cSBarry Smith PetscDraw popup; 10210513a670SBarry Smith 10220513a670SBarry Smith for (i = 0; i < nz; i++) { 1023fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10240513a670SBarry Smith } 1025383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10269566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10279566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1028383922c3SLisandro Dalcin 1029d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10300513a670SBarry Smith for (i = 0; i < m; i++) { 1031383922c3SLisandro Dalcin y_l = m - i - 1.0; 1032383922c3SLisandro Dalcin y_r = y_l + 1.0; 1033bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1034383922c3SLisandro Dalcin x_l = a->j[j]; 1035383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1036fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10379566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10380513a670SBarry Smith count++; 10390513a670SBarry Smith } 10400513a670SBarry Smith } 1041d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10420513a670SBarry Smith } 10439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1045480ef9eaSBarry Smith } 1046cddf8d76SBarry Smith 10479804daf3SBarry Smith #include <petscdraw.h> 1048ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1049d71ae5a4SJacob Faibussowitsch { 1050b0a32e0cSBarry Smith PetscDraw draw; 105136db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1052ace3abfcSBarry Smith PetscBool isnull; 1053480ef9eaSBarry Smith 1054480ef9eaSBarry Smith PetscFunctionBegin; 10559566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10569566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10573ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1058480ef9eaSBarry Smith 10599371c9d4SSatish Balay xr = A->cmap->n; 10609371c9d4SSatish Balay yr = A->rmap->n; 10619371c9d4SSatish Balay h = yr / 10.0; 10629371c9d4SSatish Balay w = xr / 10.0; 10639371c9d4SSatish Balay xr += w; 10649371c9d4SSatish Balay yr += h; 10659371c9d4SSatish Balay xl = -w; 10669371c9d4SSatish Balay yl = -h; 10679566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10689566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10699566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10709566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10719566063dSJacob 
Faibussowitsch PetscCall(PetscDrawSave(draw)); 10723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1073416022c9SBarry Smith } 1074416022c9SBarry Smith 1075d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1076d71ae5a4SJacob Faibussowitsch { 1077ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1078416022c9SBarry Smith 10793a40ed3dSBarry Smith PetscFunctionBegin; 10809566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10819566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10829566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10831baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10841baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10851baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10869566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 108817ab2063SBarry Smith } 108919bcc07fSBarry Smith 1090d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1091d71ae5a4SJacob Faibussowitsch { 1092416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1093580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1094bc43efbbSJunchao Zhang PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n; 109554f21887SBarry Smith MatScalar *aa = a->a, *ap; 10963447b6efSHong Zhang PetscReal ratio = 0.6; 109717ab2063SBarry Smith 10983a40ed3dSBarry Smith PetscFunctionBegin; 10993ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 11009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1101b215bc84SStefano Zampini if 
(A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1102b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11039566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1105b215bc84SStefano Zampini } 110617ab2063SBarry Smith 110743ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 110817ab2063SBarry Smith for (i = 1; i < m; i++) { 1109416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 111017ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111194a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111217ab2063SBarry Smith if (fshift) { 1113bfeeae90SHong Zhang ip = aj + ai[i]; 1114bfeeae90SHong Zhang ap = aa + ai[i]; 111517ab2063SBarry Smith N = ailen[i]; 11169566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 111748a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 111817ab2063SBarry Smith } 111917ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112017ab2063SBarry Smith } 112117ab2063SBarry Smith if (m) { 112217ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112317ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112417ab2063SBarry Smith } 112517ab2063SBarry Smith /* reset ilen and imax for each row */ 11267b083b7cSBarry Smith a->nonzerorowcnt = 0; 1127396832f4SHong Zhang if (A->structure_only) { 11289566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11299566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1130396832f4SHong Zhang } else { /* !A->structure_only */ 113117ab2063SBarry Smith for (i = 0; i < m; i++) { 113217ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11337b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113417ab2063SBarry Smith } 1135396832f4SHong Zhang } 
1136bfeeae90SHong Zhang a->nz = ai[m]; 1137aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 1138bc43efbbSJunchao Zhang PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly 1139bc43efbbSJunchao Zhang a->diagonaldense = PETSC_TRUE; 1140bc43efbbSJunchao Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1141bc43efbbSJunchao Zhang for (i = 0; i < n; i++) { 1142bc43efbbSJunchao Zhang if (a->diag[i] >= ai[i + 1]) { 1143bc43efbbSJunchao Zhang a->diagonaldense = PETSC_FALSE; 1144bc43efbbSJunchao Zhang break; 1145bc43efbbSJunchao Zhang } 1146bc43efbbSJunchao Zhang } 11479566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11489566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11499566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11502205254eSKarl Rupp 11518e58a170SBarry Smith A->info.mallocs += a->reallocs; 1152dd5f02e7SSatish Balay a->reallocs = 0; 11536712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 115436db0b34SBarry Smith a->rmax = rmax; 11554e220ebcSLois Curfman McInnes 115648a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11579566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 115917ab2063SBarry Smith } 116017ab2063SBarry Smith 1161ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1162d71ae5a4SJacob Faibussowitsch 
{ 116399cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116499cafbc1SBarry Smith PetscInt i, nz = a->nz; 11652e5835c6SStefano Zampini MatScalar *aa; 116699cafbc1SBarry Smith 116799cafbc1SBarry Smith PetscFunctionBegin; 11689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 116999cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 117399cafbc1SBarry Smith } 117499cafbc1SBarry Smith 1175ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1176d71ae5a4SJacob Faibussowitsch { 117799cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 117899cafbc1SBarry Smith PetscInt i, nz = a->nz; 11792e5835c6SStefano Zampini MatScalar *aa; 118099cafbc1SBarry Smith 118199cafbc1SBarry Smith PetscFunctionBegin; 11829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 118399cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 118799cafbc1SBarry Smith } 118899cafbc1SBarry Smith 1189d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1190d71ae5a4SJacob Faibussowitsch { 1191fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1192fff043a9SJunchao Zhang MatScalar *aa; 11933a40ed3dSBarry Smith 11943a40ed3dSBarry Smith PetscFunctionBegin; 11959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 11969566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 11979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 11989566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120017ab2063SBarry Smith } 1201416022c9SBarry Smith 1202d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1203d71ae5a4SJacob Faibussowitsch { 1204416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1205d5d45c9bSBarry Smith 12063a40ed3dSBarry Smith PetscFunctionBegin; 1207b4e2f619SBarry Smith if (A->hash_active) { 1208e3c72094SPierre Jolivet A->ops[0] = a->cops; 1209b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 1210b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 1211b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 1212b4e2f619SBarry Smith } 1213b4e2f619SBarry Smith 12143ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 12159566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12169566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12179566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12189566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12199566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12209566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12219566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12229566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12259566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12289566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12299566063dSJacob Faibussowitsch 
PetscCall(PetscFree(A->data)); 1230901853e0SKris Buschelman 12316718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12326718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12336718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12346718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12356718818eSStefano Zampini due to different matrix sizes */ 12369566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12376718818eSStefano Zampini 12389566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12392e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12402e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12472e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12482e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12492e956fe4SStefano Zampini 
PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12502e956fe4SStefano Zampini #endif 12514222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12554222ddf1SHong Zhang #endif 1256d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1257d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1258d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1259d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1260d5e393b6SSuyash Tandon #endif 12613d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12633d0639e7SStefano Zampini #endif 12649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1265af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1267af8000cdSHong Zhang #endif 1268d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1270d24d4204SJose E. 
Roman #endif 127163c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12729566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 127463c07aadSStefano Zampini #endif 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12792e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12902e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12912e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12922e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12932e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12942e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 12952e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 12962e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 12973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 129817ab2063SBarry Smith } 129917ab2063SBarry Smith 1300d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1301d71ae5a4SJacob Faibussowitsch { 1302416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13033a40ed3dSBarry Smith 13043a40ed3dSBarry Smith PetscFunctionBegin; 1305a65d3064SKris Buschelman switch (op) { 1306d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1307d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1308d71ae5a4SJacob Faibussowitsch break; 1309d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1310d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1311d71ae5a4SJacob Faibussowitsch break; 1312d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 
1313d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1314d71ae5a4SJacob Faibussowitsch break; 1315d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1316d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1317d71ae5a4SJacob Faibussowitsch break; 1318d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1319d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1320d71ae5a4SJacob Faibussowitsch break; 1321d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1322d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1323d71ae5a4SJacob Faibussowitsch break; 1324d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1325d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1326d71ae5a4SJacob Faibussowitsch break; 13273d472b54SHong Zhang case MAT_SPD: 1328b1646e73SJed Brown case MAT_SYMMETRIC: 1329b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1330b1646e73SJed Brown case MAT_HERMITIAN: 1331b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1332957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1333b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1334b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1335b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13365021d80fSJed Brown break; 13378c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1338a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1339d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1340d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1341d71ae5a4SJacob Faibussowitsch break; 1342d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1343d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1344d71ae5a4SJacob Faibussowitsch break; 1345d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1346d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1347d71ae5a4SJacob Faibussowitsch break; 
1348071fcb05SBarry Smith case MAT_SORTED_FULL: 1349071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1350071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1351071fcb05SBarry Smith break; 1352d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1353d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1354d71ae5a4SJacob Faibussowitsch break; 1355d71ae5a4SJacob Faibussowitsch default: 1356d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1357a65d3064SKris Buschelman } 13583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 135917ab2063SBarry Smith } 136017ab2063SBarry Smith 1361ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1362d71ae5a4SJacob Faibussowitsch { 1363416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1364fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1365c898d852SStefano Zampini PetscScalar *x; 1366c898d852SStefano Zampini const PetscScalar *aa; 136717ab2063SBarry Smith 13683a40ed3dSBarry Smith PetscFunctionBegin; 13699566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 137008401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1372d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1373d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13749566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13752c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13769566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 137935e7444dSHong Zhang } 138035e7444dSHong Zhang 13819566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 138235e7444dSHong Zhang for (i = 0; i < n; i++) { 1383fdc842d1SBarry Smith x[i] = 0.0; 138435e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 138535e7444dSHong Zhang if (aj[j] == i) { 138635e7444dSHong Zhang x[i] = aa[j]; 138717ab2063SBarry Smith break; 138817ab2063SBarry Smith } 138917ab2063SBarry Smith } 139017ab2063SBarry Smith } 13919566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 139417ab2063SBarry Smith } 139517ab2063SBarry Smith 1396c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1397d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1398d71ae5a4SJacob Faibussowitsch { 1399416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 14005f22a7b3SSebastian Grimberg const MatScalar *aa; 1401d9ca1df4SBarry Smith PetscScalar *y; 1402d9ca1df4SBarry Smith const PetscScalar *x; 1403d0f46423SBarry Smith PetscInt m = A->rmap->n; 14045c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14055f22a7b3SSebastian Grimberg const MatScalar *v; 1406a77337e4SBarry Smith PetscScalar alpha; 1407d9ca1df4SBarry Smith PetscInt n, i, j; 1408d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14093447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1410ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14115c897100SBarry Smith #endif 141217ab2063SBarry Smith 14133a40ed3dSBarry Smith PetscFunctionBegin; 14149566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14159566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14169566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14185c897100SBarry Smith 14195c897100SBarry Smith #if 
defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1420fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14215c897100SBarry Smith #else 14223447b6efSHong Zhang if (usecprow) { 14233447b6efSHong Zhang m = cprow.nrows; 14243447b6efSHong Zhang ii = cprow.i; 14257b2bb3b9SHong Zhang ridx = cprow.rindex; 14263447b6efSHong Zhang } else { 14273447b6efSHong Zhang ii = a->i; 14283447b6efSHong Zhang } 142917ab2063SBarry Smith for (i = 0; i < m; i++) { 14303447b6efSHong Zhang idx = a->j + ii[i]; 1431fff043a9SJunchao Zhang v = aa + ii[i]; 14323447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14333447b6efSHong Zhang if (usecprow) { 14347b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14353447b6efSHong Zhang } else { 143617ab2063SBarry Smith alpha = x[i]; 14373447b6efSHong Zhang } 143804fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 143917ab2063SBarry Smith } 14405c897100SBarry Smith #endif 14419566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14429566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14439566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 144617ab2063SBarry Smith } 144717ab2063SBarry Smith 1448d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1449d71ae5a4SJacob Faibussowitsch { 14505c897100SBarry Smith PetscFunctionBegin; 14519566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14529566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14545c897100SBarry Smith } 14555c897100SBarry Smith 1456c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 145778b84d54SShri Abhyankar 1458d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 
1459d71ae5a4SJacob Faibussowitsch { 1460416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1461d9fead3dSBarry Smith PetscScalar *y; 146254f21887SBarry Smith const PetscScalar *x; 14635914357eSBarry Smith const MatScalar *a_a; 1464003131ecSBarry Smith PetscInt m = A->rmap->n; 14655914357eSBarry Smith const PetscInt *ii, *ridx = NULL; 1466ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 146717ab2063SBarry Smith 1468b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 146997952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1470fee21e36SBarry Smith #endif 1471fee21e36SBarry Smith 14723a40ed3dSBarry Smith PetscFunctionBegin; 1473b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14749566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1476b215bc84SStefano Zampini } 14779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14789566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14799566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1480416022c9SBarry Smith ii = a->i; 14814eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14829566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 148397952fefSHong Zhang m = a->compressedrow.nrows; 148497952fefSHong Zhang ii = a->compressedrow.i; 148597952fefSHong Zhang ridx = a->compressedrow.rindex; 14865914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 14875914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 14885914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 14895914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 14905914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 14915914357eSBarry Smith PetscScalar sum = 0.0; 1492003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1493003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 149497952fefSHong Zhang y[*ridx++] = sum; 
149597952fefSHong Zhang } 149697952fefSHong Zhang } else { /* do not use compressed row format */ 1497b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 14985914357eSBarry Smith fortranmultaij_(&m, x, ii, a->j, a_a, y); 1499b05257ddSBarry Smith #else 15005914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 15015914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 15025914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 15035914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 15045914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 15055914357eSBarry Smith PetscScalar sum = 0.0; 1506003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 150717ab2063SBarry Smith y[i] = sum; 150817ab2063SBarry Smith } 15098d195f9aSBarry Smith #endif 1510b05257ddSBarry Smith } 15119566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15129566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15139566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 151617ab2063SBarry Smith } 151717ab2063SBarry Smith 1518ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1519ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1520d71ae5a4SJacob Faibussowitsch { 1521b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1522b434eb95SMatthew G. Knepley PetscScalar *y; 1523b434eb95SMatthew G. Knepley const PetscScalar *x; 1524fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1525b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1526b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1527b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1528b434eb95SMatthew G. Knepley PetscScalar sum; 1529b434eb95SMatthew G. 
Knepley PetscBool usecprow = a->compressedrow.use; 1530b434eb95SMatthew G. Knepley 1531b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1532b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1533b434eb95SMatthew G. Knepley #endif 1534b434eb95SMatthew G. Knepley 1535b434eb95SMatthew G. Knepley PetscFunctionBegin; 15369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15379566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15389566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1539b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1540b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1541b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1542b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1543b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1544b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1545b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1546fff043a9SJunchao Zhang aa = a_a + ii[i]; 1547b434eb95SMatthew G. Knepley sum = 0.0; 1548b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1549b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1550b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1551b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1552b434eb95SMatthew G. Knepley } 1553b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15543d3eaba7SBarry Smith ii = a->i; 1555b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1556b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1557b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1558fff043a9SJunchao Zhang aa = a_a + ii[i]; 1559b434eb95SMatthew G. Knepley sum = 0.0; 1560b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1561b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1562b434eb95SMatthew G. Knepley y[i] = sum; 1563b434eb95SMatthew G. Knepley } 1564b434eb95SMatthew G. 
Knepley } 15659566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15669566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15679566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1570b434eb95SMatthew G. Knepley } 1571b434eb95SMatthew G. Knepley 1572ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1573ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1574d71ae5a4SJacob Faibussowitsch { 1575b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1576b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1577b434eb95SMatthew G. Knepley const PetscScalar *x; 1578fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1579b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1580b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1581b434eb95SMatthew G. Knepley PetscScalar sum; 1582b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1583b434eb95SMatthew G. Knepley 1584b434eb95SMatthew G. Knepley PetscFunctionBegin; 15859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15869566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15879566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1588b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 158948a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1590b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1591b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1592b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1593b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1594b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1595b434eb95SMatthew G. 
Knepley aj = a->j + ii[i]; 1596fff043a9SJunchao Zhang aa = a_a + ii[i]; 1597b434eb95SMatthew G. Knepley sum = y[*ridx]; 1598b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1599b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1600b434eb95SMatthew G. Knepley } 1601b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16023d3eaba7SBarry Smith ii = a->i; 1603b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1604b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1605b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1606fff043a9SJunchao Zhang aa = a_a + ii[i]; 1607b434eb95SMatthew G. Knepley sum = y[i]; 1608b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1609b434eb95SMatthew G. Knepley z[i] = sum; 1610b434eb95SMatthew G. Knepley } 1611b434eb95SMatthew G. Knepley } 16129566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16139566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16149566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1617b434eb95SMatthew G. Knepley } 1618b434eb95SMatthew G. 
Knepley 1619c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1620d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1621d71ae5a4SJacob Faibussowitsch { 1622416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1623f15663dcSBarry Smith PetscScalar *y, *z; 1624f15663dcSBarry Smith const PetscScalar *x; 16255914357eSBarry Smith const MatScalar *a_a; 16265914357eSBarry Smith const PetscInt *ii, *ridx = NULL; 16275914357eSBarry Smith PetscInt m = A->rmap->n; 1628ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16299ea0dfa2SSatish Balay 16303a40ed3dSBarry Smith PetscFunctionBegin; 1631b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16329566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1634b215bc84SStefano Zampini } 16359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16369566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16379566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16384eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 163948a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 164097952fefSHong Zhang m = a->compressedrow.nrows; 164197952fefSHong Zhang ii = a->compressedrow.i; 164297952fefSHong Zhang ridx = a->compressedrow.rindex; 16435914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 16445914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 16455914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 16465914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 16475914357eSBarry Smith PetscScalar sum = y[*ridx]; 1648f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 164997952fefSHong Zhang z[*ridx++] = sum; 165097952fefSHong Zhang } 165197952fefSHong Zhang } else { /* do not use compressed row format */ 16523d3eaba7SBarry Smith ii = a->i; 
1653f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16545914357eSBarry Smith fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z); 1655f15663dcSBarry Smith #else 16565914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 16575914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 16585914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 16595914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 16605914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 16615914357eSBarry Smith PetscScalar sum = y[i]; 1662f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 166317ab2063SBarry Smith z[i] = sum; 166417ab2063SBarry Smith } 166502ab625aSSatish Balay #endif 1666f15663dcSBarry Smith } 16679566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16689566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16699566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 167217ab2063SBarry Smith } 167317ab2063SBarry Smith 167417ab2063SBarry Smith /* 167517ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
167617ab2063SBarry Smith */ 1677d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1678d71ae5a4SJacob Faibussowitsch { 1679416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1680d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1681c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 168217ab2063SBarry Smith 16833a40ed3dSBarry Smith PetscFunctionBegin; 168409f38230SBarry Smith if (!a->diag) { 16859566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1686c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 168709f38230SBarry Smith } 1688d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1689c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1690c0c07093SJunchao Zhang if (alreadySet) { 1691c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1692c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1693c0c07093SJunchao Zhang } 1694c0c07093SJunchao Zhang 169509f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1696bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1697bfeeae90SHong Zhang if (a->j[j] == i) { 169809f38230SBarry Smith a->diag[i] = j; 169917ab2063SBarry Smith break; 170017ab2063SBarry Smith } 170117ab2063SBarry Smith } 170217ab2063SBarry Smith } 17033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 170417ab2063SBarry Smith } 170517ab2063SBarry Smith 1706ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1707d71ae5a4SJacob Faibussowitsch { 170861ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 170961ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 171061ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 171161ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 171261ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 171361ecd0c6SBarry Smith 171461ecd0c6SBarry 
Smith PetscFunctionBegin; 171561ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17179566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 17183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 171961ecd0c6SBarry Smith } 172061ecd0c6SBarry Smith 172161ecd0c6SBarry Smith if (a->diagonaldense) { 172261ecd0c6SBarry Smith cnt = 0; 172361ecd0c6SBarry Smith } else { 17249566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 172561ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1726349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 172761ecd0c6SBarry Smith cnt++; 172861ecd0c6SBarry Smith mdiag[i] = 1; 172961ecd0c6SBarry Smith } 173061ecd0c6SBarry Smith } 173161ecd0c6SBarry Smith } 173261ecd0c6SBarry Smith if (!cnt) { 17339566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 173461ecd0c6SBarry Smith } else { 1735b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1736b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 17379f0612e4SBarry Smith PetscBool free_a = a->free_a, free_ij = a->free_ij; 17386ea2a7edSJunchao Zhang const PetscScalar *Aa; 17396ea2a7edSJunchao Zhang 17406ea2a7edSJunchao Zhang PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host 17416ea2a7edSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa)); 174261ecd0c6SBarry Smith 174361ecd0c6SBarry Smith a->a = NULL; 174461ecd0c6SBarry Smith a->j = NULL; 174561ecd0c6SBarry Smith a->i = NULL; 174661ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1747ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 
0, a->imax)); 174961ecd0c6SBarry Smith 175061ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 175161ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17529566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 175348a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1754447d62f5SStefano Zampini } 17559566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17569566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 17579f0612e4SBarry Smith if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda)); 17589f0612e4SBarry Smith if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj)); 17599f0612e4SBarry Smith if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi)); 176061ecd0c6SBarry Smith } 17619566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 176261ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 17633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 176461ecd0c6SBarry Smith } 176561ecd0c6SBarry Smith 1766be5855fcSBarry Smith /* 1767be5855fcSBarry Smith Checks for missing diagonals 1768be5855fcSBarry Smith */ 1769d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1770d71ae5a4SJacob Faibussowitsch { 1771be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17727734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1773be5855fcSBarry Smith 1774be5855fcSBarry Smith PetscFunctionBegin; 177509f38230SBarry Smith *missing = PETSC_FALSE; 17767734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 177709f38230SBarry Smith *missing = PETSC_TRUE; 177809f38230SBarry Smith if (d) *d = 0; 17799566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 178009f38230SBarry Smith } else { 178101445905SHong Zhang PetscInt n; 178201445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1783f1e2ffcdSBarry Smith diag = a->diag; 178401445905SHong Zhang for (i = 0; i < n; i++) { 17857734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 178609f38230SBarry Smith *missing = PETSC_TRUE; 178709f38230SBarry Smith if (d) *d = i; 17889566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1789358d2f5dSShri Abhyankar break; 179009f38230SBarry Smith } 1791be5855fcSBarry Smith } 1792be5855fcSBarry Smith } 17933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1794be5855fcSBarry Smith } 1795be5855fcSBarry Smith 17960da83c2eSBarry Smith #include <petscblaslapack.h> 17970da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 17980da83c2eSBarry Smith 17990da83c2eSBarry Smith /* 18000da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18010da83c2eSBarry Smith */ 1802ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1803d71ae5a4SJacob Faibussowitsch { 18040da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18050da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18060da83c2eSBarry Smith const PetscReal shift = 0.0; 18070da83c2eSBarry Smith PetscInt ipvt[5]; 18084e208921SJed Brown PetscCount flops = 0; 18090da83c2eSBarry Smith PetscScalar work[25], *v_work; 18100da83c2eSBarry Smith 18110da83c2eSBarry Smith PetscFunctionBegin; 18120da83c2eSBarry Smith allowzeropivot = 
PetscNot(A->erroriffailure); 18130da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 181408401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1815ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 181748a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18180da83c2eSBarry Smith ncnt = 0; 18190da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18200da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18219566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18220da83c2eSBarry Smith switch (bsizes[i]) { 1823d71ae5a4SJacob Faibussowitsch case 1: 1824d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1825d71ae5a4SJacob Faibussowitsch break; 18260da83c2eSBarry Smith case 2: 18279566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18280da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18299566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18300da83c2eSBarry Smith break; 18310da83c2eSBarry Smith case 3: 18329566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18330da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18349566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18350da83c2eSBarry Smith break; 18360da83c2eSBarry Smith case 4: 18379566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18380da83c2eSBarry Smith if (zeropivotdetected) 
A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18399566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18400da83c2eSBarry Smith break; 18410da83c2eSBarry Smith case 5: 18429566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18430da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18449566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18450da83c2eSBarry Smith break; 18460da83c2eSBarry Smith case 6: 18479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18480da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18500da83c2eSBarry Smith break; 18510da83c2eSBarry Smith case 7: 18529566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18530da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18549566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18550da83c2eSBarry Smith break; 18560da83c2eSBarry Smith default: 18579566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18580da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18599566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18600da83c2eSBarry Smith } 18610da83c2eSBarry Smith ncnt += bsizes[i]; 18620da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 1863baa50dc0SBrad Aagaard flops += 2 * PetscPowInt64(bsizes[i], 3) / 3; 18640da83c2eSBarry Smith } 18653ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 186648a46eb9SPierre 
Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18679566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18690da83c2eSBarry Smith } 18700da83c2eSBarry Smith 1871422a814eSBarry Smith /* 1872422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1873422a814eSBarry Smith */ 1874ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1875d71ae5a4SJacob Faibussowitsch { 187671f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1877d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18782e5835c6SStefano Zampini const MatScalar *v; 187954f21887SBarry Smith PetscScalar *idiag, *mdiag; 188071f1c65dSBarry Smith 188171f1c65dSBarry Smith PetscFunctionBegin; 18823ba16761SJacob Faibussowitsch if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS); 18839566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 188471f1c65dSBarry Smith diag = a->diag; 18854dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18862e5835c6SStefano Zampini 188771f1c65dSBarry Smith mdiag = a->mdiag; 188871f1c65dSBarry Smith idiag = a->idiag; 18899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1890422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 189171f1c65dSBarry Smith for (i = 0; i < m; i++) { 189271f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1893899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1894899639b0SHong Zhang if (PetscRealPart(fshift)) { 18959566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 18967b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18977b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 18987b6c816cSBarry Smith 
A->factorerror_zeropivot_row = i; 189998921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1900899639b0SHong Zhang } 190171f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 190271f1c65dSBarry Smith } 19039566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 190471f1c65dSBarry Smith } else { 190571f1c65dSBarry Smith for (i = 0; i < m; i++) { 190671f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 190771f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 190871f1c65dSBarry Smith } 19099566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 191071f1c65dSBarry Smith } 191171f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 19133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 191471f1c65dSBarry Smith } 191571f1c65dSBarry Smith 1916d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1917d71ae5a4SJacob Faibussowitsch { 1918416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1919e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19202e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 192154f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19223d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 192397f1f81fSBarry Smith const PetscInt *idx, *diag; 192417ab2063SBarry Smith 19253a40ed3dSBarry Smith PetscFunctionBegin; 1926b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19279566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 19283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1929b215bc84SStefano Zampini } 1930b965ef7fSBarry Smith its = its * lits; 193191723122SBarry Smith 193271f1c65dSBarry Smith if (fshift != a->fshift || omega != 
a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19339566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 193471f1c65dSBarry Smith a->fshift = fshift; 193571f1c65dSBarry Smith a->omega = omega; 1936ed480e8bSBarry Smith 193771f1c65dSBarry Smith diag = a->diag; 193871f1c65dSBarry Smith t = a->ssor_work; 1939ed480e8bSBarry Smith idiag = a->idiag; 194071f1c65dSBarry Smith mdiag = a->mdiag; 1941ed480e8bSBarry Smith 19429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19439566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19449566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1945ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 194617ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 194717ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1948ed480e8bSBarry Smith bs = b; 194917ab2063SBarry Smith for (i = 0; i < m; i++) { 195071f1c65dSBarry Smith d = fshift + mdiag[i]; 1951416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1952ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19532e5835c6SStefano Zampini v = aa + diag[i] + 1; 195417ab2063SBarry Smith sum = b[i] * d / omega; 1955003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 195617ab2063SBarry Smith x[i] = sum; 195717ab2063SBarry Smith } 19589566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19599566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19619566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 196317ab2063SBarry Smith } 1964c783ea89SBarry Smith 196508401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1966f7d195e4SLawrence 
Mitchell if (flag & SOR_EISENSTAT) { 19674c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1968887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 196917ab2063SBarry Smith 197017ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 197117ab2063SBarry Smith 1972887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 197317ab2063SBarry Smith */ 197417ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 197517ab2063SBarry Smith 197617ab2063SBarry Smith /* x = (E + U)^{-1} b */ 197717ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1978416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1979ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19802e5835c6SStefano Zampini v = aa + diag[i] + 1; 198117ab2063SBarry Smith sum = b[i]; 1982e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1983ed480e8bSBarry Smith x[i] = sum * idiag[i]; 198417ab2063SBarry Smith } 198517ab2063SBarry Smith 198617ab2063SBarry Smith /* t = b - (2*E - D)x */ 19872e5835c6SStefano Zampini v = aa; 19882205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 198917ab2063SBarry Smith 199017ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1991ed480e8bSBarry Smith ts = t; 1992416022c9SBarry Smith diag = a->diag; 199317ab2063SBarry Smith for (i = 0; i < m; i++) { 1994416022c9SBarry Smith n = diag[i] - a->i[i]; 1995ed480e8bSBarry Smith idx = a->j + a->i[i]; 19962e5835c6SStefano Zampini v = aa + a->i[i]; 199717ab2063SBarry Smith sum = t[i]; 1998003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 1999ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2000733d66baSBarry Smith /* x = x + t */ 2001733d66baSBarry Smith x[i] += t[i]; 200217ab2063SBarry Smith } 200317ab2063SBarry Smith 20049566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20059566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20069566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 
20073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 200817ab2063SBarry Smith } 200917ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 201017ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 201117ab2063SBarry Smith for (i = 0; i < m; i++) { 2012416022c9SBarry Smith n = diag[i] - a->i[i]; 2013ed480e8bSBarry Smith idx = a->j + a->i[i]; 20142e5835c6SStefano Zampini v = aa + a->i[i]; 201517ab2063SBarry Smith sum = b[i]; 2016e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20175c99c7daSBarry Smith t[i] = sum; 2018ed480e8bSBarry Smith x[i] = sum * idiag[i]; 201917ab2063SBarry Smith } 20205c99c7daSBarry Smith xb = t; 20219566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20223a40ed3dSBarry Smith } else xb = b; 202317ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 202417ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2025416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2026ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20272e5835c6SStefano Zampini v = aa + diag[i] + 1; 202817ab2063SBarry Smith sum = xb[i]; 2029e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20305c99c7daSBarry Smith if (xb == b) { 2031ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20325c99c7daSBarry Smith } else { 2033b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 203417ab2063SBarry Smith } 20355c99c7daSBarry Smith } 20369566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 203717ab2063SBarry Smith } 203817ab2063SBarry Smith its--; 203917ab2063SBarry Smith } 204017ab2063SBarry Smith while (its--) { 204117ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 204217ab2063SBarry Smith for (i = 0; i < m; i++) { 2043b19a5dc2SMark Adams /* lower */ 2044b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2045ed480e8bSBarry Smith idx = a->j + a->i[i]; 20462e5835c6SStefano 
Zampini v = aa + a->i[i]; 204717ab2063SBarry Smith sum = b[i]; 2048e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2049b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2050b19a5dc2SMark Adams /* upper */ 2051b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2052b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20532e5835c6SStefano Zampini v = aa + diag[i] + 1; 2054b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2055b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 205617ab2063SBarry Smith } 2057b19a5dc2SMark Adams xb = t; 20589566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2059b19a5dc2SMark Adams } else xb = b; 206017ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 206117ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2062b19a5dc2SMark Adams sum = xb[i]; 2063b19a5dc2SMark Adams if (xb == b) { 2064b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2065416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2066ed480e8bSBarry Smith idx = a->j + a->i[i]; 20672e5835c6SStefano Zampini v = aa + a->i[i]; 2068e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2069ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2070b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2071b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2072b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20732e5835c6SStefano Zampini v = aa + diag[i] + 1; 2074b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2075b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 207617ab2063SBarry Smith } 2077b19a5dc2SMark Adams } 2078b19a5dc2SMark Adams if (xb == b) { 20799566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2080b19a5dc2SMark Adams } else { 20819566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2082b19a5dc2SMark Adams } 208317ab2063SBarry Smith } 208417ab2063SBarry Smith } 20859566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20869566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 208917ab2063SBarry Smith } 209017ab2063SBarry Smith 2091ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2092d71ae5a4SJacob Faibussowitsch { 2093416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 20944e220ebcSLois Curfman McInnes 20953a40ed3dSBarry Smith PetscFunctionBegin; 20964e220ebcSLois Curfman McInnes info->block_size = 1.0; 20973966268fSBarry Smith info->nz_allocated = a->maxnz; 20983966268fSBarry Smith info->nz_used = a->nz; 20993966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21003966268fSBarry Smith info->assemblies = A->num_ass; 21013966268fSBarry Smith info->mallocs = A->info.mallocs; 21024dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2103d5f3da31SBarry Smith if (A->factortype) { 21044e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21054e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21064e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21074e220ebcSLois Curfman McInnes } else { 21084e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21094e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21104e220ebcSLois Curfman McInnes info->factor_mallocs = 
0; 21114e220ebcSLois Curfman McInnes } 21123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 211317ab2063SBarry Smith } 211417ab2063SBarry Smith 2115ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2116d71ae5a4SJacob Faibussowitsch { 2117416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2118c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 211997b48c8fSBarry Smith const PetscScalar *xx; 21202e5835c6SStefano Zampini PetscScalar *bb, *aa; 2121c7da8527SEric Chamberland PetscInt d = 0; 212217ab2063SBarry Smith 21233a40ed3dSBarry Smith PetscFunctionBegin; 212497b48c8fSBarry Smith if (x && b) { 21259566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21269566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 212797b48c8fSBarry Smith for (i = 0; i < N; i++) { 2128aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2129447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 213097b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 213197b48c8fSBarry Smith } 21329566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21339566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 213497b48c8fSBarry Smith } 213597b48c8fSBarry Smith 21369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2137a9817697SBarry Smith if (a->keepnonzeropattern) { 2138f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2139aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21409566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2141f1e2ffcdSBarry Smith } 2142f4df32b1SMatthew Knepley if (diag != 0.0) { 2143c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2144c7da8527SEric 
Chamberland d = rows[i]; 2145447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 214608401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2147c7da8527SEric Chamberland } 2148f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2149447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21502e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2151f1e2ffcdSBarry Smith } 2152f1e2ffcdSBarry Smith } 2153f1e2ffcdSBarry Smith } else { 2154f4df32b1SMatthew Knepley if (diag != 0.0) { 215517ab2063SBarry Smith for (i = 0; i < N; i++) { 2156aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21577ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2158447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2159447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2160447d62f5SStefano Zampini } else { 2161416022c9SBarry Smith a->ilen[rows[i]] = 1; 21622e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2163bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2164447d62f5SStefano Zampini } 2165447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21669566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 216717ab2063SBarry Smith } 216817ab2063SBarry Smith } 21693a40ed3dSBarry Smith } else { 217017ab2063SBarry Smith for (i = 0; i < N; i++) { 2171aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2172416022c9SBarry Smith a->ilen[rows[i]] = 0; 217317ab2063SBarry Smith } 217417ab2063SBarry Smith } 2175e56f5c9eSBarry Smith A->nonzerostate++; 2176f1e2ffcdSBarry Smith } 21779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2178dbbe0bcdSBarry Smith 
PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 218017ab2063SBarry Smith } 218117ab2063SBarry Smith 2182ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2183d71ae5a4SJacob Faibussowitsch { 21846e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21856e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21862b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21876e169961SBarry Smith const PetscScalar *xx; 21882e5835c6SStefano Zampini PetscScalar *bb, *aa; 21896e169961SBarry Smith 21906e169961SBarry Smith PetscFunctionBegin; 21913ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 21929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 21936e169961SBarry Smith if (x && b) { 21949566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21959566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 21962b40b63fSBarry Smith vecs = PETSC_TRUE; 21976e169961SBarry Smith } 21989566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 21996e169961SBarry Smith for (i = 0; i < N; i++) { 2200aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 22018e3a54c0SPierre Jolivet PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]])); 22022205254eSKarl Rupp 22036e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22046e169961SBarry Smith } 22056e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22066e169961SBarry Smith if (!zeroed[i]) { 22076e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22084cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22092e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22102e5835c6SStefano Zampini 
aa[j] = 0.0; 22116e169961SBarry Smith } 22126e169961SBarry Smith } 22134cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i]; 22146e169961SBarry Smith } 22156e169961SBarry Smith if (x && b) { 22169566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22179566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22186e169961SBarry Smith } 22199566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22206e169961SBarry Smith if (diag != 0.0) { 22219566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22221d5a398dSstefano_zampini if (missing) { 22231d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22244cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2225aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22269566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22271d5a398dSstefano_zampini } 22281d5a398dSstefano_zampini } else { 2229ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22306e169961SBarry Smith } 22311d5a398dSstefano_zampini } 22329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2233dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22356e169961SBarry Smith } 22366e169961SBarry Smith 2237d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2238d71ae5a4SJacob Faibussowitsch { 2239fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2240fff043a9SJunchao Zhang const PetscScalar *aa; 224117ab2063SBarry Smith 22423a40ed3dSBarry Smith PetscFunctionBegin; 22439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
2244416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22458e3a54c0SPierre Jolivet if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]); 224617ab2063SBarry Smith if (idx) { 22475c0db29aSPierre Jolivet if (*nz && a->j) *idx = a->j + a->i[row]; 2248f4259b30SLisandro Dalcin else *idx = NULL; 224917ab2063SBarry Smith } 22509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225217ab2063SBarry Smith } 225317ab2063SBarry Smith 2254d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2255d71ae5a4SJacob Faibussowitsch { 22563a40ed3dSBarry Smith PetscFunctionBegin; 22573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225817ab2063SBarry Smith } 225917ab2063SBarry Smith 2260ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2261d71ae5a4SJacob Faibussowitsch { 2262416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22632e5835c6SStefano Zampini const MatScalar *v; 226436db0b34SBarry Smith PetscReal sum = 0.0; 226597f1f81fSBarry Smith PetscInt i, j; 226617ab2063SBarry Smith 22673a40ed3dSBarry Smith PetscFunctionBegin; 22689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 226917ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2270570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2271570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2272792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2273570b7f6dSBarry Smith #else 2274416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22759371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22769371c9d4SSatish Balay v++; 227717ab2063SBarry Smith } 22788f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2279570b7f6dSBarry Smith #endif 22809566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22813a40ed3dSBarry Smith } else if (type == NORM_1) { 228236db0b34SBarry Smith PetscReal *tmp; 228397f1f81fSBarry Smith PetscInt *jj = a->j; 22849566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2285064f8208SBarry Smith *nrm = 0.0; 2286416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22879371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22889371c9d4SSatish Balay v++; 228917ab2063SBarry Smith } 2290d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2291064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 229217ab2063SBarry Smith } 22939566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 22949566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 22953a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2296064f8208SBarry Smith *nrm = 0.0; 2297d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 22988e3a54c0SPierre Jolivet const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]); 229917ab2063SBarry Smith sum = 0.0; 2300416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23019371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23029371c9d4SSatish Balay v2++; 230317ab2063SBarry Smith } 2304064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 230517ab2063SBarry Smith } 23069566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2307f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 231017ab2063SBarry Smith } 231117ab2063SBarry Smith 2312ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2313d71ae5a4SJacob Faibussowitsch { 23143d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 231554f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 
23162e5835c6SStefano Zampini const MatScalar *va, *vb; 231797f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2318cd0d46ebSvictorle 2319cd0d46ebSvictorle PetscFunctionBegin; 23209566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23219566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23225485867bSBarry Smith if (ma != nb || na != mb) { 23235485867bSBarry Smith *f = PETSC_FALSE; 23243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23255485867bSBarry Smith } 23269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23289371c9d4SSatish Balay aii = aij->i; 23299371c9d4SSatish Balay bii = bij->i; 23309371c9d4SSatish Balay adx = aij->j; 23319371c9d4SSatish Balay bdx = bij->j; 23329566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23339566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2334cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2335cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2336cd0d46ebSvictorle 2337cd0d46ebSvictorle *f = PETSC_TRUE; 2338cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2339cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 234097f1f81fSBarry Smith PetscInt idc, idr; 23415485867bSBarry Smith PetscScalar vc, vr; 2342cd0d46ebSvictorle /* column/row index/value */ 23435485867bSBarry Smith idc = adx[aptr[i]]; 23445485867bSBarry Smith idr = bdx[bptr[idc]]; 23455485867bSBarry Smith vc = va[aptr[i]]; 23465485867bSBarry Smith vr = vb[bptr[idc]]; 23475485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23485485867bSBarry Smith *f = PETSC_FALSE; 23495485867bSBarry Smith goto done; 2350cd0d46ebSvictorle } else { 23515485867bSBarry Smith aptr[i]++; 23525485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2353cd0d46ebSvictorle } 2354cd0d46ebSvictorle } 2355cd0d46ebSvictorle } 2356cd0d46ebSvictorle done: 23579566063dSJacob Faibussowitsch 
PetscCall(PetscFree(aptr)); 23589566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 23613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2362cd0d46ebSvictorle } 2363cd0d46ebSvictorle 2364ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2365d71ae5a4SJacob Faibussowitsch { 23663d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 236754f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 236854f21887SBarry Smith MatScalar *va, *vb; 23691cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23701cbb95d3SBarry Smith 23711cbb95d3SBarry Smith PetscFunctionBegin; 23729566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23739566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23741cbb95d3SBarry Smith if (ma != nb || na != mb) { 23751cbb95d3SBarry Smith *f = PETSC_FALSE; 23763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23771cbb95d3SBarry Smith } 23789371c9d4SSatish Balay aii = aij->i; 23799371c9d4SSatish Balay bii = bij->i; 23809371c9d4SSatish Balay adx = aij->j; 23819371c9d4SSatish Balay bdx = bij->j; 23829371c9d4SSatish Balay va = aij->a; 23839371c9d4SSatish Balay vb = bij->a; 23849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23859566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23861cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23871cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23881cbb95d3SBarry Smith 23891cbb95d3SBarry Smith *f = PETSC_TRUE; 23901cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 23911cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 23921cbb95d3SBarry Smith PetscInt idc, idr; 23931cbb95d3SBarry Smith PetscScalar vc, vr; 23941cbb95d3SBarry 
Smith /* column/row index/value */ 23951cbb95d3SBarry Smith idc = adx[aptr[i]]; 23961cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 23971cbb95d3SBarry Smith vc = va[aptr[i]]; 23981cbb95d3SBarry Smith vr = vb[bptr[idc]]; 23991cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24001cbb95d3SBarry Smith *f = PETSC_FALSE; 24011cbb95d3SBarry Smith goto done; 24021cbb95d3SBarry Smith } else { 24031cbb95d3SBarry Smith aptr[i]++; 24041cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24051cbb95d3SBarry Smith } 24061cbb95d3SBarry Smith } 24071cbb95d3SBarry Smith } 24081cbb95d3SBarry Smith done: 24099566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24109566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24121cbb95d3SBarry Smith } 24131cbb95d3SBarry Smith 2414d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2415d71ae5a4SJacob Faibussowitsch { 2416416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2417fff8e43fSBarry Smith const PetscScalar *l, *r; 2418fff8e43fSBarry Smith PetscScalar x; 241954f21887SBarry Smith MatScalar *v; 2420fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2421fff8e43fSBarry Smith const PetscInt *jj; 242217ab2063SBarry Smith 24233a40ed3dSBarry Smith PetscFunctionBegin; 242417ab2063SBarry Smith if (ll) { 24253ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24263ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24279566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 242808401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24299566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 243117ab2063SBarry Smith for (i = 0; i < m; i++) { 243217ab2063SBarry Smith x = 
l[i]; 2433416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24342205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 243517ab2063SBarry Smith } 24369566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24379566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 243917ab2063SBarry Smith } 244017ab2063SBarry Smith if (rr) { 24419566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 244208401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24439566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24452e5835c6SStefano Zampini jj = a->j; 24462205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24489566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24499566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 245017ab2063SBarry Smith } 24519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 245317ab2063SBarry Smith } 245417ab2063SBarry Smith 2455d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2456d71ae5a4SJacob Faibussowitsch { 2457db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2458d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 245997f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24605d0c19d7SBarry Smith const PetscInt *irow, *icol; 24612e5835c6SStefano Zampini const PetscScalar *aa; 24625d0c19d7SBarry Smith PetscInt nrows, ncols; 246397f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = 
a->ilen; 2464fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2465416022c9SBarry Smith Mat C; 2466cdc6f3adSToby Isaac PetscBool stride; 246717ab2063SBarry Smith 24683a40ed3dSBarry Smith PetscFunctionBegin; 24699566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24709566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24719566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 247217ab2063SBarry Smith 24739566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2474ff718158SBarry Smith if (stride) { 24759566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2476ff718158SBarry Smith } else { 2477ff718158SBarry Smith first = 0; 2478ff718158SBarry Smith step = 0; 2479ff718158SBarry Smith } 2480fee21e36SBarry Smith if (stride && step == 1) { 248102834360SBarry Smith /* special case of contiguous rows */ 24829566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 248302834360SBarry Smith /* loop over new rows determining lens and starting points */ 248402834360SBarry Smith for (i = 0; i < nrows; i++) { 2485bfeeae90SHong Zhang kstart = ai[irow[i]]; 2486a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2487a91a9bebSLisandro Dalcin starts[i] = kstart; 248802834360SBarry Smith for (k = kstart; k < kend; k++) { 2489bfeeae90SHong Zhang if (aj[k] >= first) { 249002834360SBarry Smith starts[i] = k; 249102834360SBarry Smith break; 249202834360SBarry Smith } 249302834360SBarry Smith } 2494a2744918SBarry Smith sum = 0; 249502834360SBarry Smith while (k < kend) { 2496bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2497a2744918SBarry Smith sum++; 249802834360SBarry Smith } 2499a2744918SBarry Smith lens[i] = sum; 250002834360SBarry Smith } 250102834360SBarry Smith /* create submatrix */ 2502cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 250397f1f81fSBarry Smith PetscInt n_cols, n_rows; 25049566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2505aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25069566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 250708480c60SBarry Smith C = *B; 25083a40ed3dSBarry Smith } else { 25093bef6203SJed Brown PetscInt rbs, cbs; 25109566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25119566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25129566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25139566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25149566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25159566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 251708480c60SBarry Smith } 2518db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2519db02288aSLois Curfman McInnes 252002834360SBarry Smith /* loop over rows inserting into submatrix */ 2521fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2522db02288aSLois Curfman McInnes j_new = c->j; 2523db02288aSLois Curfman McInnes i_new = c->i; 25249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 252502834360SBarry Smith for (i = 0; i < nrows; i++) { 2526a2744918SBarry Smith ii = starts[i]; 2527a2744918SBarry Smith lensi = lens[i]; 2528810441c8SPierre Jolivet if (lensi) { 2529ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25309566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2531a2744918SBarry Smith a_new += lensi; 2532810441c8SPierre Jolivet } 2533a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2534a2744918SBarry 
Smith c->ilen[i] = lensi; 253502834360SBarry Smith } 2536fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25389566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25393a40ed3dSBarry Smith } else { 25409566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25419566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25434dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25446bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25454dcab191SBarry Smith smap[icol[i]] = i + 1; 25464dcab191SBarry Smith } 25474dcab191SBarry Smith 254802834360SBarry Smith /* determine lens of each row */ 254902834360SBarry Smith for (i = 0; i < nrows; i++) { 2550bfeeae90SHong Zhang kstart = ai[irow[i]]; 255102834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 255202834360SBarry Smith lens[i] = 0; 255302834360SBarry Smith for (k = kstart; k < kend; k++) { 2554ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 255502834360SBarry Smith } 255602834360SBarry Smith } 255717ab2063SBarry Smith /* Create and fill new matrix */ 2558a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2559ace3abfcSBarry Smith PetscBool equal; 25600f5bd95cSBarry Smith 256199141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2562aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25639566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 2564fdfbdca6SPierre Jolivet PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. 
wrong number of nonzeros"); 25659566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 256608480c60SBarry Smith C = *B; 25673a40ed3dSBarry Smith } else { 25683bef6203SJed Brown PetscInt rbs, cbs; 25699566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25709566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25719566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25729566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 257337a5e0faSPierre Jolivet if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25749566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 257608480c60SBarry Smith } 25779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2578fb3c7e2dSJunchao Zhang 2579f4f49eeaSPierre Jolivet c = (Mat_SeqAIJ *)C->data; 2580fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 258117ab2063SBarry Smith for (i = 0; i < nrows; i++) { 258299141d43SSatish Balay row = irow[i]; 2583bfeeae90SHong Zhang kstart = ai[row]; 258499141d43SSatish Balay kend = kstart + a->ilen[row]; 2585bfeeae90SHong Zhang mat_i = c->i[i]; 25868e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 25878e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 258899141d43SSatish Balay mat_ilen = c->ilen + i; 258917ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2590bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2591ed480e8bSBarry Smith *mat_j++ = tcol - 1; 25922e5835c6SStefano Zampini *mat_a++ = aa[k]; 259399141d43SSatish Balay (*mat_ilen)++; 259417ab2063SBarry Smith } 259517ab2063SBarry Smith } 259617ab2063SBarry Smith } 25979566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 259802834360SBarry Smith /* Free work space */ 25999566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26009566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26019566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2602cdc6f3adSToby Isaac /* sort */ 2603cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2604cdc6f3adSToby Isaac PetscInt ilen; 2605cdc6f3adSToby Isaac 2606cdc6f3adSToby Isaac mat_i = c->i[i]; 26078e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 26088e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 2609cdc6f3adSToby Isaac ilen = c->ilen[i]; 26109566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2611cdc6f3adSToby Isaac } 2612fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 261302834360SBarry Smith } 26148c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26159566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2616305c6ccfSStefano Zampini #endif 26179566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26189566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 261917ab2063SBarry Smith 26209566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2621416022c9SBarry Smith *B = C; 26223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 262317ab2063SBarry Smith } 262417ab2063SBarry Smith 2625ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2626d71ae5a4SJacob Faibussowitsch { 262782d44351SHong Zhang Mat B; 262882d44351SHong Zhang 262982d44351SHong Zhang PetscFunctionBegin; 2630c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26319566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26329566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, 
mat->rmap->n, mat->cmap->n)); 26339566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26349566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26359566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 263682d44351SHong Zhang *subMat = B; 2637c2d650bdSHong Zhang } else { 26389566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2639c2d650bdSHong Zhang } 26403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 264182d44351SHong Zhang } 264282d44351SHong Zhang 2643ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2644d71ae5a4SJacob Faibussowitsch { 264563b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 264663b91edcSBarry Smith Mat outA; 2647ace3abfcSBarry Smith PetscBool row_identity, col_identity; 264863b91edcSBarry Smith 26493a40ed3dSBarry Smith PetscFunctionBegin; 265008401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26511df811f5SHong Zhang 26529566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26539566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2654a871dcd8SBarry Smith 265563b91edcSBarry Smith outA = inA; 2656d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26579566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26589566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26592205254eSKarl Rupp 26609566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26619566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26622205254eSKarl Rupp 2663c3122656SLisandro Dalcin a->row = row; 26642205254eSKarl Rupp 26659566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26669566063dSJacob Faibussowitsch 
PetscCall(ISDestroy(&a->col)); 26672205254eSKarl Rupp 2668c3122656SLisandro Dalcin a->col = col; 266963b91edcSBarry Smith 267036db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26719566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26729566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2673f0ec6fceSSatish Balay 267494a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 267694a9d846SBarry Smith } 267763b91edcSBarry Smith 26789566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2679137fb511SHong Zhang if (row_identity && col_identity) { 26809566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2681137fb511SHong Zhang } else { 26829566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2683137fb511SHong Zhang } 26843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2685a871dcd8SBarry Smith } 2686a871dcd8SBarry Smith 2687d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2688d71ae5a4SJacob Faibussowitsch { 2689f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2690dfa0f9e5SStefano Zampini PetscScalar *v; 2691c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 26923a40ed3dSBarry Smith 26933a40ed3dSBarry Smith PetscFunctionBegin; 26949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 26959566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2696792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 26979566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 26989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 26999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 
27003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2701f0b747eeSBarry Smith } 2702f0b747eeSBarry Smith 2703d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2704d71ae5a4SJacob Faibussowitsch { 270516b64355SHong Zhang PetscInt i; 270616b64355SHong Zhang 270716b64355SHong Zhang PetscFunctionBegin; 270816b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27099566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 271016b64355SHong Zhang 271148a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27129566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 271316b64355SHong Zhang 271416b64355SHong Zhang if (submatj->rbuf1) { 27159566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27169566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 271716b64355SHong Zhang } 271816b64355SHong Zhang 271948a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27209566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27219566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 272216b64355SHong Zhang } 272316b64355SHong Zhang 272416b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2725eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27269566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27279566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 272816b64355SHong Zhang #else 27299566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 273016b64355SHong Zhang #endif 273116b64355SHong Zhang 273216b64355SHong Zhang if (!submatj->allcolumns) { 273316b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 
2734eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap)); 273516b64355SHong Zhang #else 27369566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 273716b64355SHong Zhang #endif 273816b64355SHong Zhang } 27399566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 274016b64355SHong Zhang 27419566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 27423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 274316b64355SHong Zhang } 274416b64355SHong Zhang 2745d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2746d71ae5a4SJacob Faibussowitsch { 274716b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27485c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 274916b64355SHong Zhang 275016b64355SHong Zhang PetscFunctionBegin; 27519566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27529566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 275416b64355SHong Zhang } 275516b64355SHong Zhang 275689a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2757ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2758d71ae5a4SJacob Faibussowitsch { 27592d033e1fSHong Zhang PetscInt i; 27600fb991dcSHong Zhang Mat C; 27610fb991dcSHong Zhang Mat_SeqAIJ *c; 27620fb991dcSHong Zhang Mat_SubSppt *submatj; 27632d033e1fSHong Zhang 27642d033e1fSHong Zhang PetscFunctionBegin; 27652d033e1fSHong Zhang for (i = 0; i < n; i++) { 27660fb991dcSHong Zhang C = (*mat)[i]; 27670fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27680fb991dcSHong Zhang submatj = c->submatis1; 27692d033e1fSHong Zhang if (submatj) { 2770682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 277126cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27729566063dSJacob Faibussowitsch 
PetscCall((*submatj->destroy)(C)); 27739566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27749566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27753faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27769566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27779566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27789566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2779682e4c99SStefano Zampini } 27802d033e1fSHong Zhang } else { 27819566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27822d033e1fSHong Zhang } 27832d033e1fSHong Zhang } 278486e85357SHong Zhang 278563a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27869566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 278763a75b2aSHong Zhang 27889566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 27893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 27902d033e1fSHong Zhang } 27912d033e1fSHong Zhang 2792ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2793d71ae5a4SJacob Faibussowitsch { 279497f1f81fSBarry Smith PetscInt i; 2795cddf8d76SBarry Smith 27963a40ed3dSBarry Smith PetscFunctionBegin; 279748a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2798cddf8d76SBarry Smith 279948a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2801cddf8d76SBarry Smith } 2802cddf8d76SBarry Smith 2803ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2804d71ae5a4SJacob Faibussowitsch { 2805e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28069a88ca10SBarry Smith PetscInt 
row, i, j, k, l, ll, m, n, *nidx, isz, val; 28075d0c19d7SBarry Smith const PetscInt *idx; 28089a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1; 2809f1af5d2fSBarry Smith PetscBT table; 2810bbd702dbSSatish Balay 28113a40ed3dSBarry Smith PetscFunctionBegin; 28129a88ca10SBarry Smith m = A->rmap->n / bs; 2813e4d965acSSatish Balay ai = a->i; 2814bfeeae90SHong Zhang aj = a->j; 28158a047759SSatish Balay 281608401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 281706763907SSatish Balay 28189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28199566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 282006763907SSatish Balay 2821e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2822b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2823e4d965acSSatish Balay isz = 0; 28249566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2825e4d965acSSatish Balay 2826e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28279566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28289566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2829e4d965acSSatish Balay 28309a88ca10SBarry Smith if (bs > 1) { 28319a88ca10SBarry Smith /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 28329a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28339a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28349a88ca10SBarry Smith } 28359a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28369a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28379a88ca10SBarry Smith 28389a88ca10SBarry Smith k = 0; 28399a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28409a88ca10SBarry Smith n = isz; 28419a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28429a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28439a88ca10SBarry Smith row = bs * nidx[k] + ll; 28449a88ca10SBarry Smith start = ai[row]; 28459a88ca10SBarry Smith end = ai[row + 1]; 28469a88ca10SBarry Smith for (l = start; l < end; l++) { 28479a88ca10SBarry Smith val = aj[l] / bs; 28489a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28499a88ca10SBarry Smith } 28509a88ca10SBarry Smith } 28519a88ca10SBarry Smith } 28529a88ca10SBarry Smith } 28539a88ca10SBarry Smith PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i))); 28549a88ca10SBarry Smith } else { 2855dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2856e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28572205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28584dcbc457SBarry Smith } 28599566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28609566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2861e4d965acSSatish Balay 286204a348a9SBarry Smith k = 0; 286304a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 286404a348a9SBarry Smith n = isz; 286506763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2866e4d965acSSatish Balay row = nidx[k]; 2867e4d965acSSatish Balay start = ai[row]; 2868e4d965acSSatish Balay end = ai[row + 1]; 286904a348a9SBarry Smith for (l = start; l < end; l++) { 2870efb16452SHong Zhang val = aj[l]; 28712205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2872e4d965acSSatish Balay } 2873e4d965acSSatish Balay } 2874e4d965acSSatish Balay } 28759566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2876e4d965acSSatish Balay } 28779a88ca10SBarry Smith } 28789566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28799566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28814dcbc457SBarry Smith } 288217ab2063SBarry Smith 2883ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2884d71ae5a4SJacob Faibussowitsch { 28850513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28863b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 28875d0c19d7SBarry Smith const PetscInt *row, *col; 28885d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 288956cd22aeSBarry Smith IS icolp, irowp; 28900298fd71SBarry Smith PetscInt *cwork = NULL; 28910298fd71SBarry Smith PetscScalar *vwork = NULL; 28920513a670SBarry Smith 
28933a40ed3dSBarry Smith PetscFunctionBegin; 28949566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 28959566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 28969566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 28979566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 28980513a670SBarry Smith 28990513a670SBarry Smith /* determine lengths of permuted rows */ 29009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29012205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29029566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29039566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29049566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29059566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29079566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29080513a670SBarry Smith 29099566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29100513a670SBarry Smith for (i = 0; i < m; i++) { 29119566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29122205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29139566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29149566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29150513a670SBarry Smith } 29169566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29172205254eSKarl Rupp 29183c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29192205254eSKarl Rupp 29208c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29219566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29229fe5e383SStefano Zampini #endif 
29239566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29249566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29259566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29269566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29279566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29289566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 292948a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29310513a670SBarry Smith } 29320513a670SBarry Smith 2933d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2934d71ae5a4SJacob Faibussowitsch { 2935cb5b572fSBarry Smith PetscFunctionBegin; 293633f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 293733f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2938be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2939be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29402e5835c6SStefano Zampini const PetscScalar *aa; 2941be6bf707SBarry Smith 29429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 294308401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29449566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29459566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2947cb5b572fSBarry Smith } else { 29489566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2949cb5b572fSBarry Smith } 29503ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 2951cb5b572fSBarry Smith } 2952cb5b572fSBarry Smith 2953d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2954d71ae5a4SJacob Faibussowitsch { 29556c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29566e111a19SKarl Rupp 29576c0721eeSBarry Smith PetscFunctionBegin; 29586c0721eeSBarry Smith *array = a->a; 29593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29606c0721eeSBarry Smith } 29616c0721eeSBarry Smith 2962d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[]) 2963d71ae5a4SJacob Faibussowitsch { 29646c0721eeSBarry Smith PetscFunctionBegin; 2965f38c1e66SStefano Zampini *array = NULL; 29663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29676c0721eeSBarry Smith } 2968273d9f13SBarry Smith 29698229c054SShri Abhyankar /* 29708229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29718229c054SShri Abhyankar have different nonzero structure. 
29728229c054SShri Abhyankar */ 2973d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2974d71ae5a4SJacob Faibussowitsch { 2975b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2976ec7775f6SShri Abhyankar 2977ec7775f6SShri Abhyankar PetscFunctionBegin; 2978ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2979ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 29808e3a54c0SPierre Jolivet const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]); 2981b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 2982b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 29838af7cee1SJed Brown nnz[i] = 0; 29848af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 2985b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2986b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 29878af7cee1SJed Brown nnz[i]++; 29888af7cee1SJed Brown } 29898af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 2990ec7775f6SShri Abhyankar } 29913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2992ec7775f6SShri Abhyankar } 2993ec7775f6SShri Abhyankar 2994d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 2995d71ae5a4SJacob Faibussowitsch { 2996b264fe52SHong Zhang PetscInt m = Y->rmap->N; 2997b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 2998b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data; 2999b264fe52SHong Zhang 3000b264fe52SHong Zhang PetscFunctionBegin; 3001b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30029566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 30033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3004b264fe52SHong Zhang } 
3005b264fe52SHong Zhang 3006d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3007d71ae5a4SJacob Faibussowitsch { 3008ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3009ac90fabeSBarry Smith 3010ac90fabeSBarry Smith PetscFunctionBegin; 3011134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3012134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3013134adf20SPierre Jolivet if (e) { 30149566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 301581fa06acSBarry Smith if (e) { 30169566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3017134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 301881fa06acSBarry Smith } 301981fa06acSBarry Smith } 302054c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 302181fa06acSBarry Smith } 3022ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30232e5835c6SStefano Zampini const PetscScalar *xa; 30242e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 302581fa06acSBarry Smith PetscBLASInt one = 1, bnz; 302681fa06acSBarry Smith 30279566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3030792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 30319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30339566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30359566063dSJacob 
Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3036ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30379566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3038ac90fabeSBarry Smith } else { 30398229c054SShri Abhyankar Mat B; 30408229c054SShri Abhyankar PetscInt *nnz; 30419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30429566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30439566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30449566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30459566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30469566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30489566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30499566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30509bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30519566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3052ac90fabeSBarry Smith } 30533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3054ac90fabeSBarry Smith } 3055ac90fabeSBarry Smith 3056d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3057d71ae5a4SJacob Faibussowitsch { 3058354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3059354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3060354c94deSBarry Smith PetscInt i, nz; 3061354c94deSBarry Smith PetscScalar *a; 3062354c94deSBarry Smith 3063354c94deSBarry Smith PetscFunctionBegin; 3064354c94deSBarry Smith nz = aij->nz; 30659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30662205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 
30679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3068354c94deSBarry Smith #else 3069354c94deSBarry Smith PetscFunctionBegin; 3070354c94deSBarry Smith #endif 30713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3072354c94deSBarry Smith } 3073354c94deSBarry Smith 3074ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3075d71ae5a4SJacob Faibussowitsch { 3076e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3077d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3078e34fafa9SBarry Smith PetscReal atmp; 3079985db425SBarry Smith PetscScalar *x; 3080ce496241SStefano Zampini const MatScalar *aa, *av; 3081e34fafa9SBarry Smith 3082e34fafa9SBarry Smith PetscFunctionBegin; 308328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 30849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3085ce496241SStefano Zampini aa = av; 3086e34fafa9SBarry Smith ai = a->i; 3087e34fafa9SBarry Smith aj = a->j; 3088e34fafa9SBarry Smith 30899566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 30909566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 30919566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 309208401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3093e34fafa9SBarry Smith for (i = 0; i < m; i++) { 30949371c9d4SSatish Balay ncols = ai[1] - ai[0]; 30959371c9d4SSatish Balay ai++; 3096e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3097985db425SBarry Smith atmp = PetscAbsScalar(*aa); 30989371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 30999371c9d4SSatish Balay x[i] = atmp; 31009371c9d4SSatish Balay if (idx) idx[i] = *aj; 31019371c9d4SSatish Balay } 31029371c9d4SSatish Balay aa++; 31039371c9d4SSatish Balay aj++; 3104985db425SBarry Smith } 3105985db425SBarry 
Smith } 31069566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3109985db425SBarry Smith } 3110985db425SBarry Smith 3111eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v) 3112eede4a3fSMark Adams { 3113eede4a3fSMark Adams Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3114eede4a3fSMark Adams PetscInt i, j, m = A->rmap->n, *ai, ncols, n; 3115eede4a3fSMark Adams PetscScalar *x; 3116eede4a3fSMark Adams const MatScalar *aa, *av; 3117eede4a3fSMark Adams 3118eede4a3fSMark Adams PetscFunctionBegin; 3119eede4a3fSMark Adams PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3120eede4a3fSMark Adams PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3121eede4a3fSMark Adams aa = av; 3122eede4a3fSMark Adams ai = a->i; 3123eede4a3fSMark Adams 3124eede4a3fSMark Adams PetscCall(VecSet(v, 0.0)); 3125eede4a3fSMark Adams PetscCall(VecGetArrayWrite(v, &x)); 3126eede4a3fSMark Adams PetscCall(VecGetLocalSize(v, &n)); 3127eede4a3fSMark Adams PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3128eede4a3fSMark Adams for (i = 0; i < m; i++) { 3129eede4a3fSMark Adams ncols = ai[1] - ai[0]; 3130eede4a3fSMark Adams ai++; 3131eede4a3fSMark Adams for (j = 0; j < ncols; j++) { 3132eede4a3fSMark Adams x[i] += PetscAbsScalar(*aa); 3133eede4a3fSMark Adams aa++; 3134eede4a3fSMark Adams } 3135eede4a3fSMark Adams } 3136eede4a3fSMark Adams PetscCall(VecRestoreArrayWrite(v, &x)); 3137eede4a3fSMark Adams PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3138eede4a3fSMark Adams PetscFunctionReturn(PETSC_SUCCESS); 3139eede4a3fSMark Adams } 3140eede4a3fSMark Adams 3141ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3142d71ae5a4SJacob Faibussowitsch { 3143985db425SBarry Smith Mat_SeqAIJ *a 
= (Mat_SeqAIJ *)A->data; 3144d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3145985db425SBarry Smith PetscScalar *x; 3146ce496241SStefano Zampini const MatScalar *aa, *av; 3147985db425SBarry Smith 3148985db425SBarry Smith PetscFunctionBegin; 314928b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3151ce496241SStefano Zampini aa = av; 3152985db425SBarry Smith ai = a->i; 3153985db425SBarry Smith aj = a->j; 3154985db425SBarry Smith 31559566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31569566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31579566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 315808401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3159985db425SBarry Smith for (i = 0; i < m; i++) { 31609371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31619371c9d4SSatish Balay ai++; 3162d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31639371c9d4SSatish Balay x[i] = *aa; 31649371c9d4SSatish Balay if (idx) idx[i] = 0; 3165985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3166985db425SBarry Smith x[i] = 0.0; 3167985db425SBarry Smith if (idx) { 3168985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3169985db425SBarry Smith if (aj[j] > j) { 3170985db425SBarry Smith idx[i] = j; 3171985db425SBarry Smith break; 3172985db425SBarry Smith } 3173985db425SBarry Smith } 31741a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31751a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3176985db425SBarry Smith } 3177985db425SBarry Smith } 3178985db425SBarry Smith for (j = 0; j < ncols; j++) { 31799371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) 
{ 31809371c9d4SSatish Balay x[i] = *aa; 31819371c9d4SSatish Balay if (idx) idx[i] = *aj; 31829371c9d4SSatish Balay } 31839371c9d4SSatish Balay aa++; 31849371c9d4SSatish Balay aj++; 3185985db425SBarry Smith } 3186985db425SBarry Smith } 31879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3190985db425SBarry Smith } 3191985db425SBarry Smith 3192ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3193d71ae5a4SJacob Faibussowitsch { 3194c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3195c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3196ce496241SStefano Zampini PetscScalar *x; 3197ce496241SStefano Zampini const MatScalar *aa, *av; 3198c87e5d42SMatthew Knepley 3199c87e5d42SMatthew Knepley PetscFunctionBegin; 32009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3201ce496241SStefano Zampini aa = av; 3202c87e5d42SMatthew Knepley ai = a->i; 3203c87e5d42SMatthew Knepley aj = a->j; 3204c87e5d42SMatthew Knepley 32059566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32069566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32079566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 320808401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. 
%" PetscInt_FMT " rows", m, n); 3209c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32109371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32119371c9d4SSatish Balay ai++; 3212f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32139371c9d4SSatish Balay x[i] = *aa; 32149371c9d4SSatish Balay if (idx) idx[i] = 0; 3215f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3216f07e67edSHong Zhang x[i] = 0.0; 3217f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3218289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3219f07e67edSHong Zhang if (aj[j] > j) { 3220f07e67edSHong Zhang idx[i] = j; 32212205254eSKarl Rupp break; 32222205254eSKarl Rupp } 3223289a08f5SMatthew Knepley } 3224f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3225f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3226f07e67edSHong Zhang } 3227289a08f5SMatthew Knepley } 3228c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32299371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32309371c9d4SSatish Balay x[i] = *aa; 32319371c9d4SSatish Balay if (idx) idx[i] = *aj; 32329371c9d4SSatish Balay } 32339371c9d4SSatish Balay aa++; 32349371c9d4SSatish Balay aj++; 3235c87e5d42SMatthew Knepley } 3236c87e5d42SMatthew Knepley } 32379566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3240c87e5d42SMatthew Knepley } 3241c87e5d42SMatthew Knepley 3242ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3243d71ae5a4SJacob Faibussowitsch { 3244985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3245d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3246d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3247985db425SBarry Smith PetscScalar *x; 
3248ce496241SStefano Zampini const MatScalar *aa, *av; 3249985db425SBarry Smith 3250985db425SBarry Smith PetscFunctionBegin; 325128b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3253ce496241SStefano Zampini aa = av; 3254985db425SBarry Smith ai = a->i; 3255985db425SBarry Smith aj = a->j; 3256985db425SBarry Smith 32579566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32589566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32599566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 326008401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3261985db425SBarry Smith for (i = 0; i < m; i++) { 32629371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32639371c9d4SSatish Balay ai++; 3264d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32659371c9d4SSatish Balay x[i] = *aa; 32669371c9d4SSatish Balay if (idx) idx[i] = 0; 3267985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3268985db425SBarry Smith x[i] = 0.0; 3269985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3270985db425SBarry Smith for (j = 0; j < ncols; j++) { 3271985db425SBarry Smith if (aj[j] > j) { 3272985db425SBarry Smith idx[i] = j; 3273985db425SBarry Smith break; 3274985db425SBarry Smith } 3275985db425SBarry Smith } 3276fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3277fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3278985db425SBarry Smith } 3279985db425SBarry Smith } 3280985db425SBarry Smith for (j = 0; j < ncols; j++) { 32819371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32829371c9d4SSatish Balay x[i] = *aa; 32839371c9d4SSatish Balay if (idx) idx[i] = *aj; 32849371c9d4SSatish Balay } 32859371c9d4SSatish Balay aa++; 
32869371c9d4SSatish Balay aj++; 3287e34fafa9SBarry Smith } 3288e34fafa9SBarry Smith } 32899566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3292e34fafa9SBarry Smith } 3293bbead8a2SBarry Smith 3294ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3295d71ae5a4SJacob Faibussowitsch { 3296bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 329733d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3298bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 32990da83c2eSBarry Smith const PetscReal shift = 0.0; 33001a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3301bbead8a2SBarry Smith 3302bbead8a2SBarry Smith PetscFunctionBegin; 3303a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33044a0d0026SBarry Smith if (a->ibdiagvalid) { 33054a0d0026SBarry Smith if (values) *values = a->ibdiag; 33063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 33074a0d0026SBarry Smith } 33089566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 33094dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3310bbead8a2SBarry Smith diag = a->ibdiag; 3311bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3312bbead8a2SBarry Smith /* factor and invert each block */ 3313bbead8a2SBarry Smith switch (bs) { 3314bbead8a2SBarry Smith case 1: 3315bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33169566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 3317ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3318ec1892c8SHong Zhang if (allowzeropivot) { 33197b6c816cSBarry Smith A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 33207b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33217b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33229566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 332398921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3324ec1892c8SHong Zhang } 3325bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3326bbead8a2SBarry Smith } 3327bbead8a2SBarry Smith break; 3328bbead8a2SBarry Smith case 2: 3329bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33309371c9d4SSatish Balay ij[0] = 2 * i; 33319371c9d4SSatish Balay ij[1] = 2 * i + 1; 33329566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33339566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33347b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33359566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3336bbead8a2SBarry Smith diag += 4; 3337bbead8a2SBarry Smith } 3338bbead8a2SBarry Smith break; 3339bbead8a2SBarry Smith case 3: 3340bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33419371c9d4SSatish Balay ij[0] = 3 * i; 33429371c9d4SSatish Balay ij[1] = 3 * i + 1; 33439371c9d4SSatish Balay ij[2] = 3 * i + 2; 33449566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33459566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 33467b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33479566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3348bbead8a2SBarry Smith diag += 9; 3349bbead8a2SBarry Smith } 3350bbead8a2SBarry Smith break; 3351bbead8a2SBarry Smith case 4: 3352bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33539371c9d4SSatish Balay ij[0] = 4 * i; 33549371c9d4SSatish Balay ij[1] = 4 * i + 1; 33559371c9d4SSatish Balay ij[2] = 4 * i + 2; 33569371c9d4SSatish Balay ij[3] = 4 * i + 3; 33579566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33589566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33597b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3361bbead8a2SBarry Smith diag += 16; 3362bbead8a2SBarry Smith } 3363bbead8a2SBarry Smith break; 3364bbead8a2SBarry Smith case 5: 3365bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33669371c9d4SSatish Balay ij[0] = 5 * i; 33679371c9d4SSatish Balay ij[1] = 5 * i + 1; 33689371c9d4SSatish Balay ij[2] = 5 * i + 2; 33699371c9d4SSatish Balay ij[3] = 5 * i + 3; 33709371c9d4SSatish Balay ij[4] = 5 * i + 4; 33719566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33729566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33737b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33749566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3375bbead8a2SBarry Smith diag += 25; 3376bbead8a2SBarry Smith } 3377bbead8a2SBarry Smith break; 3378bbead8a2SBarry Smith case 6: 3379bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33809371c9d4SSatish Balay ij[0] = 6 * i; 33819371c9d4SSatish Balay ij[1] = 6 * i + 1; 33829371c9d4SSatish Balay ij[2] = 6 * i + 2; 33839371c9d4SSatish Balay ij[3] = 6 * i + 3; 33849371c9d4SSatish Balay ij[4] = 
6 * i + 4; 33859371c9d4SSatish Balay ij[5] = 6 * i + 5; 33869566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33879566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33887b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33899566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3390bbead8a2SBarry Smith diag += 36; 3391bbead8a2SBarry Smith } 3392bbead8a2SBarry Smith break; 3393bbead8a2SBarry Smith case 7: 3394bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33959371c9d4SSatish Balay ij[0] = 7 * i; 33969371c9d4SSatish Balay ij[1] = 7 * i + 1; 33979371c9d4SSatish Balay ij[2] = 7 * i + 2; 33989371c9d4SSatish Balay ij[3] = 7 * i + 3; 33999371c9d4SSatish Balay ij[4] = 7 * i + 4; 34009371c9d4SSatish Balay ij[5] = 7 * i + 5; 3401cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 34029566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 34039566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 34047b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34059566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3406bbead8a2SBarry Smith diag += 49; 3407bbead8a2SBarry Smith } 3408bbead8a2SBarry Smith break; 3409bbead8a2SBarry Smith default: 34109566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3411bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3412ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34139566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34149566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 34157b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = 
MAT_FACTOR_NUMERIC_ZEROPIVOT; 34169566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3417bbead8a2SBarry Smith diag += bs2; 3418bbead8a2SBarry Smith } 34199566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3420bbead8a2SBarry Smith } 3421bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 34223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3423bbead8a2SBarry Smith } 3424bbead8a2SBarry Smith 3425d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3426d71ae5a4SJacob Faibussowitsch { 342773a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3428fff043a9SJunchao Zhang PetscScalar a, *aa; 342973a71a0fSBarry Smith PetscInt m, n, i, j, col; 343073a71a0fSBarry Smith 343173a71a0fSBarry Smith PetscFunctionBegin; 343273a71a0fSBarry Smith if (!x->assembled) { 34339566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 343473a71a0fSBarry Smith for (i = 0; i < m; i++) { 343573a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34369566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 343773a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34389566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 343973a71a0fSBarry Smith } 344073a71a0fSBarry Smith } 3441e2ce353bSJunchao Zhang } else { 34429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34439566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3445e2ce353bSJunchao Zhang } 34469566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34479566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 344973a71a0fSBarry Smith } 345073a71a0fSBarry Smith 3451679944adSJunchao 
Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3452d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3453d71ae5a4SJacob Faibussowitsch { 3454679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3455679944adSJunchao Zhang PetscScalar a; 3456679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3457679944adSJunchao Zhang 3458679944adSJunchao Zhang PetscFunctionBegin; 3459679944adSJunchao Zhang nskip = high - low; 34609566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3461679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3462679944adSJunchao Zhang for (i = 0; i < m; i++) { 3463679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34649566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3465679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3466679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34679566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3468679944adSJunchao Zhang } 3469e2ce353bSJunchao Zhang } 34709566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34719566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3473679944adSJunchao Zhang } 3474679944adSJunchao Zhang 34750a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3476cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3477cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3478cb5b572fSBarry Smith MatMult_SeqAIJ, 347997304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34807c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34817c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3482f4259b30SLisandro Dalcin NULL, 3483f4259b30SLisandro Dalcin NULL, 
3484f4259b30SLisandro Dalcin NULL, 3485f4259b30SLisandro Dalcin /* 10*/ NULL, 3486cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3487f4259b30SLisandro Dalcin NULL, 348841f059aeSBarry Smith MatSOR_SeqAIJ, 348991e9d3e2SHong Zhang MatTranspose_SeqAIJ, 349097304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3491cb5b572fSBarry Smith MatEqual_SeqAIJ, 3492cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3493cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3494cb5b572fSBarry Smith MatNorm_SeqAIJ, 3495f4259b30SLisandro Dalcin /* 20*/ NULL, 3496cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3497cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3498cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3499d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3500f4259b30SLisandro Dalcin NULL, 3501f4259b30SLisandro Dalcin NULL, 3502f4259b30SLisandro Dalcin NULL, 3503f4259b30SLisandro Dalcin NULL, 350426cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 3505f4259b30SLisandro Dalcin NULL, 3506f4259b30SLisandro Dalcin NULL, 3507f4259b30SLisandro Dalcin NULL, 3508f4259b30SLisandro Dalcin NULL, 3509d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3510f4259b30SLisandro Dalcin NULL, 3511f4259b30SLisandro Dalcin NULL, 3512cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3513f4259b30SLisandro Dalcin NULL, 3514d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35157dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3516cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3517cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3518cb5b572fSBarry Smith MatCopy_SeqAIJ, 3519d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3520cb5b572fSBarry Smith MatScale_SeqAIJ, 35217d68702bSBarry Smith MatShift_SeqAIJ, 352279299369SBarry Smith MatDiagonalSet_SeqAIJ, 35236e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 352473a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35253b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35263b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35273b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3528a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 
352993dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3530f4259b30SLisandro Dalcin NULL, 3531f4259b30SLisandro Dalcin NULL, 3532cda55fadSBarry Smith MatPermute_SeqAIJ, 3533f4259b30SLisandro Dalcin NULL, 3534f4259b30SLisandro Dalcin /* 59*/ NULL, 3535b9b97703SBarry Smith MatDestroy_SeqAIJ, 3536b9b97703SBarry Smith MatView_SeqAIJ, 3537f4259b30SLisandro Dalcin NULL, 3538f4259b30SLisandro Dalcin NULL, 3539f4259b30SLisandro Dalcin /* 64*/ NULL, 3540321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3541f4259b30SLisandro Dalcin NULL, 3542f4259b30SLisandro Dalcin NULL, 3543f4259b30SLisandro Dalcin NULL, 3544d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3545c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3546f4259b30SLisandro Dalcin NULL, 3547f4259b30SLisandro Dalcin NULL, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin /* 74*/ NULL, 35503acb8795SBarry Smith MatFDColoringApply_AIJ, 3551f4259b30SLisandro Dalcin NULL, 3552f4259b30SLisandro Dalcin NULL, 3553f4259b30SLisandro Dalcin NULL, 35546ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3555f4259b30SLisandro Dalcin NULL, 3556f4259b30SLisandro Dalcin NULL, 3557f4259b30SLisandro Dalcin NULL, 3558bc011b1eSHong Zhang MatLoad_SeqAIJ, 35596cff0a6bSPierre Jolivet /* 84*/ NULL, 35606cff0a6bSPierre Jolivet NULL, 3561f4259b30SLisandro Dalcin NULL, 3562f4259b30SLisandro Dalcin NULL, 3563f4259b30SLisandro Dalcin NULL, 3564f4259b30SLisandro Dalcin /* 89*/ NULL, 3565f4259b30SLisandro Dalcin NULL, 356626be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3567f4259b30SLisandro Dalcin NULL, 3568f4259b30SLisandro Dalcin NULL, 35698fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3570f4259b30SLisandro Dalcin NULL, 3571f4259b30SLisandro Dalcin NULL, 35726fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3573f4259b30SLisandro Dalcin NULL, 35744222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3575f4259b30SLisandro Dalcin NULL, 3576f4259b30SLisandro 
Dalcin NULL, 357787d4246cSBarry Smith MatConjugate_SeqAIJ, 3578f4259b30SLisandro Dalcin NULL, 3579d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 358099cafbc1SBarry Smith MatRealPart_SeqAIJ, 3581f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3582f4259b30SLisandro Dalcin NULL, 3583f4259b30SLisandro Dalcin NULL, 3584cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3585f4259b30SLisandro Dalcin NULL, 35862af78befSBarry Smith MatGetRowMin_SeqAIJ, 3587f4259b30SLisandro Dalcin NULL, 3588599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3589f4259b30SLisandro Dalcin /*114*/ NULL, 3590f4259b30SLisandro Dalcin NULL, 3591f4259b30SLisandro Dalcin NULL, 3592f4259b30SLisandro Dalcin NULL, 3593f4259b30SLisandro Dalcin NULL, 3594f4259b30SLisandro Dalcin /*119*/ NULL, 3595f4259b30SLisandro Dalcin NULL, 3596f4259b30SLisandro Dalcin NULL, 3597f4259b30SLisandro Dalcin NULL, 3598b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 35990716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3600a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 360137868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 36020da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3603f4259b30SLisandro Dalcin NULL, 3604f4259b30SLisandro Dalcin /*129*/ NULL, 3605f4259b30SLisandro Dalcin NULL, 3606f4259b30SLisandro Dalcin NULL, 360775648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3608b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3609b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36102b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3611f4259b30SLisandro Dalcin NULL, 3612f4259b30SLisandro Dalcin NULL, 36133964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3614f4259b30SLisandro Dalcin /*139*/ NULL, 3615f4259b30SLisandro Dalcin NULL, 3616f4259b30SLisandro Dalcin NULL, 36173a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36189c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36194222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 
36204222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3621f4259b30SLisandro Dalcin NULL, 362272833a62Smarkadams4 NULL, 362372833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36242d776b49SBarry Smith NULL, 3625dec0b466SHong Zhang /*150*/ MatTransposeSymbolic_SeqAIJ, 3626eede4a3fSMark Adams MatEliminateZeros_SeqAIJ, 36274cc2b5b5SPierre Jolivet MatGetRowSumAbs_SeqAIJ, 36284cc2b5b5SPierre Jolivet NULL}; 362917ab2063SBarry Smith 3630ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3631d71ae5a4SJacob Faibussowitsch { 3632bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 363397f1f81fSBarry Smith PetscInt i, nz, n; 3634bef8e0ddSBarry Smith 3635bef8e0ddSBarry Smith PetscFunctionBegin; 3636bef8e0ddSBarry Smith nz = aij->maxnz; 3637d0f46423SBarry Smith n = mat->rmap->n; 3638ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3639bef8e0ddSBarry Smith aij->nz = nz; 3640ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 36413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3642bef8e0ddSBarry Smith } 3643bef8e0ddSBarry Smith 3644a3bb6f32SFande Kong /* 3645ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3646ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3647ddea5d60SJunchao Zhang */ 3648d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3649d71ae5a4SJacob Faibussowitsch { 3650a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3651eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3652eec179cfSJacob Faibussowitsch PetscHashIter tpos; 365325b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 365425b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3655a3bb6f32SFande Kong 3656a3bb6f32SFande Kong PetscFunctionBegin; 3657a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 36584f572ea9SToby Isaac PetscAssertPointer(mapping, 2); 3659a3bb6f32SFande Kong /* use a table */ 3660eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3661a3bb6f32SFande Kong ec = 0; 366225b670f0SStefano Zampini for (i = 0; i < nz; i++) { 366325b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3664eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3665a3bb6f32SFande Kong if (!data) { 3666a3bb6f32SFande Kong /* one based table */ 3667c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3668a3bb6f32SFande Kong } 3669a3bb6f32SFande Kong } 3670a3bb6f32SFande Kong /* form array of columns we need */ 36719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3672eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3673eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3674eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3675eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3676eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3677a3bb6f32SFande Kong gid--; 3678a3bb6f32SFande 
Kong lid--; 3679a3bb6f32SFande Kong garray[lid] = gid; 3680a3bb6f32SFande Kong } 36819566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3682eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3683c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3684a3bb6f32SFande Kong /* compact out the extra columns in B */ 368525b670f0SStefano Zampini for (i = 0; i < nz; i++) { 368625b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3687eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3688a3bb6f32SFande Kong lid--; 368925b670f0SStefano Zampini jj[i] = lid; 3690a3bb6f32SFande Kong } 36919566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3692eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 36939566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36949566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36959566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 36963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3697a3bb6f32SFande Kong } 3698a3bb6f32SFande Kong 3699bef8e0ddSBarry Smith /*@ 3700bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3701bef8e0ddSBarry Smith in the matrix. 
3702bef8e0ddSBarry Smith 3703bef8e0ddSBarry Smith Input Parameters: 370411a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3705bef8e0ddSBarry Smith - indices - the column indices 3706bef8e0ddSBarry Smith 370715091d37SBarry Smith Level: advanced 370815091d37SBarry Smith 3709bef8e0ddSBarry Smith Notes: 3710bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3711bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 371211a5261eSBarry Smith of the `MatSetValues()` operation. 3713bef8e0ddSBarry Smith 3714bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 371511a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3716bef8e0ddSBarry Smith 371711a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3718bef8e0ddSBarry Smith 3719b9617806SBarry Smith The indices should start with zero, not one. 3720b9617806SBarry Smith 37211cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ` 3722bef8e0ddSBarry Smith @*/ 3723d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3724d71ae5a4SJacob Faibussowitsch { 3725bef8e0ddSBarry Smith PetscFunctionBegin; 37260700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 37274f572ea9SToby Isaac PetscAssertPointer(indices, 2); 3728cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 37293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3730bef8e0ddSBarry Smith } 3731bef8e0ddSBarry Smith 3732ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3733d71ae5a4SJacob Faibussowitsch { 3734be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3735d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3736be6bf707SBarry Smith 3737be6bf707SBarry Smith PetscFunctionBegin; 373828b400f6SJacob Faibussowitsch 
PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3739be6bf707SBarry Smith 3740be6bf707SBarry Smith /* allocate space for values if not already there */ 37414dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3742be6bf707SBarry Smith 3743be6bf707SBarry Smith /* copy values over */ 37449566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 37453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3746be6bf707SBarry Smith } 3747be6bf707SBarry Smith 3748be6bf707SBarry Smith /*@ 374920f4b53cSBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the 3750be6bf707SBarry Smith nonlinear portion. 3751be6bf707SBarry Smith 3752c3339decSBarry Smith Logically Collect 3753be6bf707SBarry Smith 375427430b45SBarry Smith Input Parameter: 375511a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3756be6bf707SBarry Smith 375715091d37SBarry Smith Level: advanced 375815091d37SBarry Smith 37592920cce0SJacob Faibussowitsch Example Usage: 376027430b45SBarry Smith .vb 37612ef1f0ffSBarry Smith Using SNES 376227430b45SBarry Smith Create Jacobian matrix 376327430b45SBarry Smith Set linear terms into matrix 376427430b45SBarry Smith Apply boundary conditions to matrix, at this time matrix must have 376527430b45SBarry Smith final nonzero structure (i.e. 
setting the nonlinear terms and applying 376627430b45SBarry Smith boundary conditions again will not change the nonzero structure) 376727430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 376827430b45SBarry Smith MatStoreValues(mat); 376927430b45SBarry Smith Call SNESSetJacobian() with matrix 377027430b45SBarry Smith In your Jacobian routine 377127430b45SBarry Smith MatRetrieveValues(mat); 377227430b45SBarry Smith Set nonlinear terms in matrix 3773be6bf707SBarry Smith 377427430b45SBarry Smith Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself: 377527430b45SBarry Smith // build linear portion of Jacobian 377627430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 377727430b45SBarry Smith MatStoreValues(mat); 377827430b45SBarry Smith loop over nonlinear iterations 377927430b45SBarry Smith MatRetrieveValues(mat); 378027430b45SBarry Smith // call MatSetValues(mat,...) to set nonlinear portion of Jacobian 378127430b45SBarry Smith // call MatAssemblyBegin/End() on matrix 378227430b45SBarry Smith Solve linear system with Jacobian 378327430b45SBarry Smith endloop 378427430b45SBarry Smith .ve 3785be6bf707SBarry Smith 3786be6bf707SBarry Smith Notes: 3787da81f932SPierre Jolivet Matrix must already be assembled before calling this routine. 378811a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3789be6bf707SBarry Smith calling this routine. 3790be6bf707SBarry Smith 37910c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37920c468ba9SBarry Smith and does not allocate additional space.
37930c468ba9SBarry Smith 3794fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()` 3795be6bf707SBarry Smith @*/ 3796d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3797d71ae5a4SJacob Faibussowitsch { 3798be6bf707SBarry Smith PetscFunctionBegin; 37990700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 380028b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 380128b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3802cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 38033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3804be6bf707SBarry Smith } 3805be6bf707SBarry Smith 3806ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3807d71ae5a4SJacob Faibussowitsch { 3808be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3809d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3810be6bf707SBarry Smith 3811be6bf707SBarry Smith PetscFunctionBegin; 381228b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 381328b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3814be6bf707SBarry Smith /* copy values over */ 38159566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 38163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3817be6bf707SBarry Smith } 3818be6bf707SBarry Smith 3819be6bf707SBarry Smith /*@ 382020f4b53cSBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()` 3821be6bf707SBarry Smith 3822c3339decSBarry Smith Logically Collect 3823be6bf707SBarry Smith 38242fe279fdSBarry Smith 
Input Parameter: 382511a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3826be6bf707SBarry Smith 382715091d37SBarry Smith Level: advanced 382815091d37SBarry Smith 38291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()` 3830be6bf707SBarry Smith @*/ 3831d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3832d71ae5a4SJacob Faibussowitsch { 3833be6bf707SBarry Smith PetscFunctionBegin; 38340700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 383528b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 383628b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3837cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 38383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3839be6bf707SBarry Smith } 3840be6bf707SBarry Smith 38415d83a8b1SBarry Smith /*@ 384211a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 38430d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 384420f4b53cSBarry Smith the user should preallocate the matrix storage by setting the parameter `nz` 384520f4b53cSBarry Smith (or the array `nnz`). 384617ab2063SBarry Smith 3847d083f849SBarry Smith Collective 3848db81eaa0SLois Curfman McInnes 384917ab2063SBarry Smith Input Parameters: 385011a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 385117ab2063SBarry Smith . m - number of rows 385217ab2063SBarry Smith . n - number of columns 385317ab2063SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 385451c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38550298fd71SBarry Smith (possibly different for each row) or NULL 385617ab2063SBarry Smith 385717ab2063SBarry Smith Output Parameter: 3858416022c9SBarry Smith . A - the matrix 385917ab2063SBarry Smith 38602ef1f0ffSBarry Smith Options Database Keys: 38612ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 38622ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 38632ef1f0ffSBarry Smith 38642ef1f0ffSBarry Smith Level: intermediate 3865175b88e8SBarry Smith 3866b259b22eSLois Curfman McInnes Notes: 386777433607SBarry Smith It is recommended to use `MatCreateFromOptions()` instead of this routine 386877433607SBarry Smith 38692ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 387049a6f317SBarry Smith 38712ef1f0ffSBarry Smith The `MATSEQAIJ` format, also called 38722ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 38730002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 38742ef1f0ffSBarry Smith either one (as in Fortran) or zero. 387517ab2063SBarry Smith 387620f4b53cSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 38772ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 387820f4b53cSBarry Smith allocation. 387917ab2063SBarry Smith 3880682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38814fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3882682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38836c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency.
38846c7ebb05SLois Curfman McInnes 38851cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 388617ab2063SBarry Smith @*/ 3887d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3888d71ae5a4SJacob Faibussowitsch { 38893a40ed3dSBarry Smith PetscFunctionBegin; 38909566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 38919566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 38929566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 38939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 38943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3895273d9f13SBarry Smith } 3896273d9f13SBarry Smith 38975d83a8b1SBarry Smith /*@ 3898273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3899273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3900273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3901273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3902273d9f13SBarry Smith 3903d083f849SBarry Smith Collective 3904273d9f13SBarry Smith 3905273d9f13SBarry Smith Input Parameters: 39061c4f3114SJed Brown + B - The matrix 3907273d9f13SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 3908273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 39090298fd71SBarry Smith (possibly different for each row) or NULL 3910273d9f13SBarry Smith 39112ef1f0ffSBarry Smith Options Database Keys: 39122ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 39132ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 39142ef1f0ffSBarry Smith 39152ef1f0ffSBarry Smith Level: intermediate 39162ef1f0ffSBarry Smith 3917273d9f13SBarry Smith Notes: 39182ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 391949a6f317SBarry Smith 392011a5261eSBarry Smith The `MATSEQAIJ` format, also called 39212ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 3922273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3923273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3924273d9f13SBarry Smith 39252ef1f0ffSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 39262ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 39272ef1f0ffSBarry Smith allocation. 3928273d9f13SBarry Smith 392911a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3930aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded. 3931aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3932aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed.
3933aa95bbe8SBarry Smith 393411a5261eSBarry Smith Developer Notes: 393511a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3936a96a251dSBarry Smith entries or columns indices 3937a96a251dSBarry Smith 3938273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3939273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3940273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3941273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3942273d9f13SBarry Smith 39431cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3944db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3945273d9f13SBarry Smith @*/ 3946d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3947d71ae5a4SJacob Faibussowitsch { 3948a23d5eceSKris Buschelman PetscFunctionBegin; 39496ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39506ba663aaSJed Brown PetscValidType(B, 1); 3951cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 39523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3953a23d5eceSKris Buschelman } 3954a23d5eceSKris Buschelman 3955d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3956d71ae5a4SJacob Faibussowitsch { 3957ad79cf63SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 39582576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE; 395997f1f81fSBarry Smith PetscInt i; 3960273d9f13SBarry Smith 3961273d9f13SBarry Smith PetscFunctionBegin; 3962ad79cf63SBarry Smith if (B->hash_active) { 3963aea10558SJacob Faibussowitsch B->ops[0] = 
b->cops; 3964ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3965ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3966ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3967ad79cf63SBarry Smith } 39682576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3969a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3970c461c341SBarry Smith skipallocation = PETSC_TRUE; 3971c461c341SBarry Smith nz = 0; 3972c461c341SBarry Smith } 39739566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39749566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3975899cda47SBarry Smith 3976435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 397708401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 39789f0612e4SBarry Smith if (nnz) { 3979d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 398008401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 398108401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3982b73539f3SBarry Smith } 3983b73539f3SBarry Smith } 3984b73539f3SBarry Smith 3985273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3986ab93d7beSBarry Smith if (!skipallocation) { 39874dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3988071fcb05SBarry Smith if (!b->ilen) { 3989071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39909566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3991071fcb05SBarry Smith } else { 39929566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39932ee49352SLisandro Dalcin } 3994aa624791SPierre Jolivet if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); 3995273d9f13SBarry Smith if (!nnz) { 3996435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3997c62bd62aSJed Brown else if (nz < 0) nz = 1; 39985d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3999d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 4000c43c4a61SBarry Smith PetscCall(PetscIntMultError(nz, B->rmap->n, &nz)); 4001273d9f13SBarry Smith } else { 4002c73702f5SBarry Smith PetscInt64 nz64 = 0; 40039371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 40049371c9d4SSatish Balay b->imax[i] = nnz[i]; 40059371c9d4SSatish Balay nz64 += nnz[i]; 40069371c9d4SSatish Balay } 40079566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 4008273d9f13SBarry Smith } 4009ab93d7beSBarry Smith 4010273d9f13SBarry Smith /* allocate the matrix space */ 40119566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 40129f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscInt), (void **)&b->j)); 40139f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(B->rmap->n + 1, sizeof(PetscInt), (void **)&b->i)); 40149f0612e4SBarry Smith b->free_ij = PETSC_TRUE; 4015396832f4SHong Zhang if (B->structure_only) { 40169f0612e4SBarry Smith b->free_a = PETSC_FALSE; 4017396832f4SHong Zhang } else { 40189f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscScalar), (void **)&b->a)); 40199f0612e4SBarry Smith b->free_a = PETSC_TRUE; 4020396832f4SHong Zhang } 4021bfeeae90SHong Zhang b->i[0] = 0; 4022ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4023c461c341SBarry Smith } else { 
4024e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4025e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4026c461c341SBarry Smith } 4027273d9f13SBarry Smith 4028846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4029846b4da1SFande Kong /* reserve user-requested sparsity */ 40309566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4031846b4da1SFande Kong } 4032846b4da1SFande Kong 4033273d9f13SBarry Smith b->nz = 0; 4034273d9f13SBarry Smith b->maxnz = nz; 4035273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40361baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4037cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4038cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40395519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40405519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 40415519a089SJose E. Roman */ 40425519a089SJose E. Roman B->nonzerostate++; 40433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4044273d9f13SBarry Smith } 4045273d9f13SBarry Smith 4046ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4047d71ae5a4SJacob Faibussowitsch { 4048846b4da1SFande Kong Mat_SeqAIJ *a; 4049a5bbaf83SFande Kong PetscInt i; 40501f14be2bSBarry Smith PetscBool skipreset; 4051846b4da1SFande Kong 4052846b4da1SFande Kong PetscFunctionBegin; 4053846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 405414d0e64fSAlex Lindsay 405514d0e64fSAlex Lindsay /* Check local size. 
If zero, then return */ 40563ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 405714d0e64fSAlex Lindsay 4058846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40592c814fdeSFande Kong /* if no saved info, we error out */ 406028b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40612c814fdeSFande Kong 40621f14be2bSBarry Smith PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40632c814fdeSFande Kong 40641f14be2bSBarry Smith PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset)); 40651f14be2bSBarry Smith if (!skipreset) { 40669566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40679566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4068846b4da1SFande Kong a->i[0] = 0; 4069ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4070846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4071846b4da1SFande Kong a->nz = 0; 4072846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4073846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4074846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4075846b4da1SFande Kong A->assembled = PETSC_FALSE; 40761f14be2bSBarry Smith } 40773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4078846b4da1SFande Kong } 4079846b4da1SFande Kong 408058d36128SBarry Smith /*@ 408111a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4082a1661176SMatthew Knepley 4083a1661176SMatthew Knepley Input Parameters: 4084a1661176SMatthew Knepley + B - the matrix 4085d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero) 4086d8a51d2aSBarry Smith . 
j - the column indices for each row (indices start with zero) these must be sorted for each row 4087d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided 4088a1661176SMatthew Knepley 4089a1661176SMatthew Knepley Level: developer 4090a1661176SMatthew Knepley 40916a9b8d82SBarry Smith Notes: 40922ef1f0ffSBarry Smith The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 409358d36128SBarry Smith 40946a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 40956a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 40966a9b8d82SBarry Smith 40976a9b8d82SBarry Smith Developer Notes: 40982ef1f0ffSBarry Smith An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and 40992ef1f0ffSBarry Smith then just copies the `v` values directly with `PetscMemcpy()`. 41006a9b8d82SBarry Smith 410111a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
41026a9b8d82SBarry Smith 4103fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()` 4104a1661176SMatthew Knepley @*/ 4105d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4106d71ae5a4SJacob Faibussowitsch { 4107a1661176SMatthew Knepley PetscFunctionBegin; 41080700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41096ba663aaSJed Brown PetscValidType(B, 1); 4110cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 41113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4112a1661176SMatthew Knepley } 4113a1661176SMatthew Knepley 4114ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4115d71ae5a4SJacob Faibussowitsch { 4116a1661176SMatthew Knepley PetscInt i; 4117a1661176SMatthew Knepley PetscInt m, n; 4118a1661176SMatthew Knepley PetscInt nz; 41196a9b8d82SBarry Smith PetscInt *nnz; 4120a1661176SMatthew Knepley 4121a1661176SMatthew Knepley PetscFunctionBegin; 4122aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4123779a8d59SSatish Balay 41249566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41259566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4126779a8d59SSatish Balay 41279566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41289566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4129a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4130b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 413108401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, 
"Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4132a1661176SMatthew Knepley nnz[i] = nz; 4133a1661176SMatthew Knepley } 41349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41359566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4136a1661176SMatthew Knepley 41378e3a54c0SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES)); 4138a1661176SMatthew Knepley 41399566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41409566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4141a1661176SMatthew Knepley 41429566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 41433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4144a1661176SMatthew Knepley } 4145a1661176SMatthew Knepley 4146ad7e164aSPierre Jolivet /*@ 41472ef1f0ffSBarry Smith MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`. 4148ad7e164aSPierre Jolivet 4149ad7e164aSPierre Jolivet Input Parameters: 4150ad7e164aSPierre Jolivet + A - left-hand side matrix 4151ad7e164aSPierre Jolivet . B - right-hand side matrix 415211a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4153ad7e164aSPierre Jolivet 4154ad7e164aSPierre Jolivet Output Parameter: 41552ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B` 4156ad7e164aSPierre Jolivet 4157ad7e164aSPierre Jolivet Level: intermediate 4158ad7e164aSPierre Jolivet 415911a5261eSBarry Smith Note: 416011a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4161ad7e164aSPierre Jolivet 41621cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4163ad7e164aSPierre Jolivet @*/ 4164d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4165d71ae5a4SJacob Faibussowitsch { 4166ad7e164aSPierre Jolivet PetscFunctionBegin; 4167ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4168ad7e164aSPierre Jolivet PetscValidType(A, 1); 4169ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4170ad7e164aSPierre Jolivet PetscValidType(B, 2); 41714f572ea9SToby Isaac PetscAssertPointer(C, 4); 4172ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4173ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4174ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4175ad7e164aSPierre Jolivet } 4176cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 41773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4178ad7e164aSPierre Jolivet } 4179ad7e164aSPierre Jolivet 4180ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4181d71ae5a4SJacob Faibussowitsch { 4182ad7e164aSPierre Jolivet Mat newmat; 4183ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4184ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4185ad7e164aSPierre Jolivet PetscScalar *v; 4186fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4187ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4188ad7e164aSPierre Jolivet PetscBool flg; 4189ad7e164aSPierre Jolivet 4190ad7e164aSPierre Jolivet PetscFunctionBegin; 419128b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 419228b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 419328b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 419428b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 41959566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 419628b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4197aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4198ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 41999566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 42009566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 42019566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 42029566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4203ad7e164aSPierre Jolivet i[0] = 0; 4204ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4205ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4206ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4207ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4208ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4209ad7e164aSPierre Jolivet } 4210ad7e164aSPierre Jolivet } 4211ad7e164aSPierre Jolivet } 42129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4213ad7e164aSPierre Jolivet *C = newmat; 42149566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4215ad7e164aSPierre Jolivet nnz = 0; 4216ad7e164aSPierre Jolivet } 42179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 
42189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4220ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4221ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4222ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4223ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4224ad7e164aSPierre Jolivet } 4225ad7e164aSPierre Jolivet } 4226ad7e164aSPierre Jolivet } 42279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 42303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4231ad7e164aSPierre Jolivet } 4232ad7e164aSPierre Jolivet 4233c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4234af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4235170fe5c8SBarry Smith 4236170fe5c8SBarry Smith /* 4237170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4238170fe5c8SBarry Smith 4239170fe5c8SBarry Smith n p p 42402da392ccSBarry Smith [ ] [ ] [ ] 42412da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42422da392ccSBarry Smith [ ] [ ] [ ] 4243170fe5c8SBarry Smith 4244170fe5c8SBarry Smith */ 4245d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4246d71ae5a4SJacob Faibussowitsch { 4247170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4248170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4249170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 425086214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4251170fe5c8SBarry Smith const PetscInt *ii, *idx; 4252170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4253170fe5c8SBarry Smith PetscScalar *c, *c_q; 425486214ceeSStefano Zampini PetscInt clda 
= sub_c->lda; 425586214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4256170fe5c8SBarry Smith 4257170fe5c8SBarry Smith PetscFunctionBegin; 4258d0f46423SBarry Smith m = A->rmap->n; 4259d0f46423SBarry Smith n = A->cmap->n; 4260d0f46423SBarry Smith p = B->cmap->n; 4261170fe5c8SBarry Smith a = sub_a->v; 4262170fe5c8SBarry Smith b = sub_b->a; 4263170fe5c8SBarry Smith c = sub_c->v; 426486214ceeSStefano Zampini if (clda == m) { 42659566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 426686214ceeSStefano Zampini } else { 426786214ceeSStefano Zampini for (j = 0; j < p; j++) 42689371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 426986214ceeSStefano Zampini } 4270170fe5c8SBarry Smith ii = sub_b->i; 4271170fe5c8SBarry Smith idx = sub_b->j; 4272170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4273170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4274170fe5c8SBarry Smith while (q-- > 0) { 427586214ceeSStefano Zampini c_q = c + clda * (*idx); 427686214ceeSStefano Zampini a_q = a + alda * i; 4277854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4278170fe5c8SBarry Smith idx++; 4279170fe5c8SBarry Smith b++; 4280170fe5c8SBarry Smith } 4281170fe5c8SBarry Smith } 42823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4283170fe5c8SBarry Smith } 4284170fe5c8SBarry Smith 4285d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4286d71ae5a4SJacob Faibussowitsch { 4287d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 428886214ceeSStefano Zampini PetscBool cisdense; 4289170fe5c8SBarry Smith 4290170fe5c8SBarry Smith PetscFunctionBegin; 429108401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42929566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 42939566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 
4294d5e393b6SSuyash Tandon PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 429548a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 42969566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4297d73949e8SHong Zhang 42984222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 42993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4300170fe5c8SBarry Smith } 4301170fe5c8SBarry Smith 43020bad9183SKris Buschelman /*MC 4303fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43040bad9183SKris Buschelman based on compressed sparse row format. 43050bad9183SKris Buschelman 43062ef1f0ffSBarry Smith Options Database Key: 43070bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43080bad9183SKris Buschelman 43090bad9183SKris Buschelman Level: beginner 43100bad9183SKris Buschelman 43110cd7f59aSBarry Smith Notes: 43122ef1f0ffSBarry Smith `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values, 43130cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43140cd7f59aSBarry Smith in the matrix 43150cd7f59aSBarry Smith 431611a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this no 431711a5261eSBarry Smith space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored 43180cd7f59aSBarry Smith 431911a5261eSBarry Smith Developer Note: 43202ef1f0ffSBarry Smith It would be nice if all matrix formats supported passing `NULL` in for the numerical values 43210cd7f59aSBarry Smith 43221cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 43230bad9183SKris Buschelman M*/ 43240bad9183SKris Buschelman 4325ccd284c7SBarry Smith /*MC 4326ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 4327ccd284c7SBarry Smith 432811a5261eSBarry Smith This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator, 432911a5261eSBarry Smith and `MATMPIAIJ` otherwise. As a result, for single process communicators, 433011a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4331ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4332ccd284c7SBarry Smith the above preallocation routines for simplicity. 4333ccd284c7SBarry Smith 43342ef1f0ffSBarry Smith Options Database Key: 433511a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()` 4336ccd284c7SBarry Smith 43372ef1f0ffSBarry Smith Level: beginner 43382ef1f0ffSBarry Smith 433911a5261eSBarry Smith Note: 434011a5261eSBarry Smith Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when 4341ccd284c7SBarry Smith enough exist. 
4342ccd284c7SBarry Smith 43431cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4344ccd284c7SBarry Smith M*/ 4345ccd284c7SBarry Smith 4346ccd284c7SBarry Smith /*MC 4347ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4348ccd284c7SBarry Smith 43492ef1f0ffSBarry Smith Options Database Key: 43502ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 43512ef1f0ffSBarry Smith 43522ef1f0ffSBarry Smith Level: beginner 43532ef1f0ffSBarry Smith 43542ef1f0ffSBarry Smith Note: 435511a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 435611a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 435711a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4358ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4359ccd284c7SBarry Smith the above preallocation routines for simplicity. 4360ccd284c7SBarry Smith 43611cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4362ccd284c7SBarry Smith M*/ 4363ccd284c7SBarry Smith 43647906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43657906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43667906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43677906f579SHong Zhang #endif 4368d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4369d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4370d24d4204SJose E. 
Roman #endif 43717906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43727906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43737906f579SHong Zhang #endif 43747906f579SHong Zhang 4375d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4376c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43774222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43787906f579SHong Zhang 43798c778c55SBarry Smith /*@C 438011a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43818c778c55SBarry Smith 43828c778c55SBarry Smith Not Collective 43838c778c55SBarry Smith 43848c778c55SBarry Smith Input Parameter: 4385fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 43868c778c55SBarry Smith 43878c778c55SBarry Smith Output Parameter: 43888c778c55SBarry Smith . 
array - pointer to the data 43898c778c55SBarry Smith 43908c778c55SBarry Smith Level: intermediate 43918c778c55SBarry Smith 4392fe59aa6dSJacob Faibussowitsch Fortran Notes: 43930ab4885dSBarry Smith `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()` 43940ab4885dSBarry Smith 43951cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 43968c778c55SBarry Smith @*/ 43975d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[]) 4398d71ae5a4SJacob Faibussowitsch { 4399d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44008c778c55SBarry Smith 44018c778c55SBarry Smith PetscFunctionBegin; 4402d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44039566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4404d67d9f35SJunchao Zhang } else { 4405d67d9f35SJunchao Zhang *array = aij->a; 4406d67d9f35SJunchao Zhang } 44073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4408d67d9f35SJunchao Zhang } 4409d67d9f35SJunchao Zhang 4410d67d9f35SJunchao Zhang /*@C 441111a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4412d67d9f35SJunchao Zhang 4413d67d9f35SJunchao Zhang Not Collective 4414d67d9f35SJunchao Zhang 4415d67d9f35SJunchao Zhang Input Parameters: 4416fe59aa6dSJacob Faibussowitsch + A - a `MATSEQAIJ` matrix 4417d67d9f35SJunchao Zhang - array - pointer to the data 4418d67d9f35SJunchao Zhang 4419d67d9f35SJunchao Zhang Level: intermediate 4420d67d9f35SJunchao Zhang 4421fe59aa6dSJacob Faibussowitsch Fortran Notes: 44220ab4885dSBarry Smith `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()` 44230ab4885dSBarry Smith 44241cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4425d67d9f35SJunchao Zhang @*/ 
44265d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[]) 4427d71ae5a4SJacob Faibussowitsch { 4428d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4429d67d9f35SJunchao Zhang 4430d67d9f35SJunchao Zhang PetscFunctionBegin; 4431d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44329566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4433d67d9f35SJunchao Zhang } else { 4434d67d9f35SJunchao Zhang *array = NULL; 4435d67d9f35SJunchao Zhang } 44369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44379566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44398c778c55SBarry Smith } 44408c778c55SBarry Smith 444121e72a00SBarry Smith /*@C 444211a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44438f1ea47aSStefano Zampini 44440ab4885dSBarry Smith Not Collective; No Fortran Support 44458f1ea47aSStefano Zampini 44468f1ea47aSStefano Zampini Input Parameter: 4447fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44488f1ea47aSStefano Zampini 44498f1ea47aSStefano Zampini Output Parameter: 44508f1ea47aSStefano Zampini . 
array - pointer to the data 44518f1ea47aSStefano Zampini 44528f1ea47aSStefano Zampini Level: intermediate 44538f1ea47aSStefano Zampini 44541cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44558f1ea47aSStefano Zampini @*/ 44565d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[]) 4457d71ae5a4SJacob Faibussowitsch { 4458d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44598f1ea47aSStefano Zampini 44608f1ea47aSStefano Zampini PetscFunctionBegin; 4461d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44629566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4463d67d9f35SJunchao Zhang } else { 4464d67d9f35SJunchao Zhang *array = aij->a; 4465d67d9f35SJunchao Zhang } 44663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44678f1ea47aSStefano Zampini } 44688f1ea47aSStefano Zampini 44698f1ea47aSStefano Zampini /*@C 447011a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44718f1ea47aSStefano Zampini 44720ab4885dSBarry Smith Not Collective; No Fortran Support 44738f1ea47aSStefano Zampini 44748f1ea47aSStefano Zampini Input Parameter: 4475fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44768f1ea47aSStefano Zampini 44778f1ea47aSStefano Zampini Output Parameter: 44788f1ea47aSStefano Zampini . 
array - pointer to the data 44798f1ea47aSStefano Zampini 44808f1ea47aSStefano Zampini Level: intermediate 44818f1ea47aSStefano Zampini 44821cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44838f1ea47aSStefano Zampini @*/ 44845d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[]) 4485d71ae5a4SJacob Faibussowitsch { 4486d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44878f1ea47aSStefano Zampini 44888f1ea47aSStefano Zampini PetscFunctionBegin; 4489d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44909566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4491d67d9f35SJunchao Zhang } else { 4492d67d9f35SJunchao Zhang *array = NULL; 4493d67d9f35SJunchao Zhang } 44943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4495d67d9f35SJunchao Zhang } 4496d67d9f35SJunchao Zhang 4497d67d9f35SJunchao Zhang /*@C 449811a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4499d67d9f35SJunchao Zhang 45000ab4885dSBarry Smith Not Collective; No Fortran Support 4501d67d9f35SJunchao Zhang 4502d67d9f35SJunchao Zhang Input Parameter: 4503fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 4504d67d9f35SJunchao Zhang 4505d67d9f35SJunchao Zhang Output Parameter: 4506d67d9f35SJunchao Zhang . 
array - pointer to the data 4507d67d9f35SJunchao Zhang 4508d67d9f35SJunchao Zhang Level: intermediate 4509d67d9f35SJunchao Zhang 45101cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4511d67d9f35SJunchao Zhang @*/ 45125d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[]) 4513d71ae5a4SJacob Faibussowitsch { 4514d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4515d67d9f35SJunchao Zhang 4516d67d9f35SJunchao Zhang PetscFunctionBegin; 4517d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45189566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4519d67d9f35SJunchao Zhang } else { 4520d67d9f35SJunchao Zhang *array = aij->a; 4521d67d9f35SJunchao Zhang } 45229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45239566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 45243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4525d67d9f35SJunchao Zhang } 4526d67d9f35SJunchao Zhang 4527d67d9f35SJunchao Zhang /*@C 4528d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4529d67d9f35SJunchao Zhang 45300ab4885dSBarry Smith Not Collective; No Fortran Support 4531d67d9f35SJunchao Zhang 4532d67d9f35SJunchao Zhang Input Parameter: 4533fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix 4534d67d9f35SJunchao Zhang 4535d67d9f35SJunchao Zhang Output Parameter: 4536d67d9f35SJunchao Zhang . 
array - pointer to the data 4537d67d9f35SJunchao Zhang 4538d67d9f35SJunchao Zhang Level: intermediate 4539d67d9f35SJunchao Zhang 45401cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4541d67d9f35SJunchao Zhang @*/ 45425d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[]) 4543d71ae5a4SJacob Faibussowitsch { 4544d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4545d67d9f35SJunchao Zhang 4546d67d9f35SJunchao Zhang PetscFunctionBegin; 4547d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45489566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4549d67d9f35SJunchao Zhang } else { 4550d67d9f35SJunchao Zhang *array = NULL; 4551d67d9f35SJunchao Zhang } 45523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45538f1ea47aSStefano Zampini } 45548f1ea47aSStefano Zampini 45558f1ea47aSStefano Zampini /*@C 455611a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45577ee59b9bSJunchao Zhang 45580ab4885dSBarry Smith Not Collective; No Fortran Support 45597ee59b9bSJunchao Zhang 45607ee59b9bSJunchao Zhang Input Parameter: 456111a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45627ee59b9bSJunchao Zhang 45637ee59b9bSJunchao Zhang Output Parameters: 45647ee59b9bSJunchao Zhang + i - row map array of the matrix 45657ee59b9bSJunchao Zhang . j - column index array of the matrix 45667ee59b9bSJunchao Zhang . a - data array of the matrix 4567fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays 45687ee59b9bSJunchao Zhang 4569fe59aa6dSJacob Faibussowitsch Level: developer 45702ef1f0ffSBarry Smith 45717ee59b9bSJunchao Zhang Notes: 45722ef1f0ffSBarry Smith Any of the output parameters can be `NULL`, in which case the corresponding value is not returned. 45737ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. 
Otherwise, they are on the host. 45747ee59b9bSJunchao Zhang 45757ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45762ef1f0ffSBarry Smith If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix. 45777ee59b9bSJunchao Zhang 45781cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45797ee59b9bSJunchao Zhang @*/ 45805d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype) 4581d71ae5a4SJacob Faibussowitsch { 45827ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45837ee59b9bSJunchao Zhang 45847ee59b9bSJunchao Zhang PetscFunctionBegin; 45857ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45867ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45877ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45887ee59b9bSJunchao Zhang } else { 45897ee59b9bSJunchao Zhang if (i) *i = aij->i; 45907ee59b9bSJunchao Zhang if (j) *j = aij->j; 45917ee59b9bSJunchao Zhang if (a) *a = aij->a; 45927ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45937ee59b9bSJunchao Zhang } 45943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45957ee59b9bSJunchao Zhang } 45967ee59b9bSJunchao Zhang 4597cc4c1da9SBarry Smith /*@ 459821e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 459921e72a00SBarry Smith 460021e72a00SBarry Smith Not Collective 460121e72a00SBarry Smith 460221e72a00SBarry Smith Input Parameter: 4603fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 460421e72a00SBarry Smith 460521e72a00SBarry Smith Output Parameter: 460621e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 460721e72a00SBarry Smith 460821e72a00SBarry Smith Level: intermediate 460921e72a00SBarry Smith 46101cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 461121e72a00SBarry Smith @*/ 4612d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4613d71ae5a4SJacob Faibussowitsch { 461421e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 461521e72a00SBarry Smith 461621e72a00SBarry Smith PetscFunctionBegin; 461721e72a00SBarry Smith *nz = aij->rmax; 46183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 461921e72a00SBarry Smith } 462021e72a00SBarry Smith 46212c4ab24aSJunchao Zhang static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void *data) 46222c4ab24aSJunchao Zhang { 46232c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)data; 46244d86920dSPierre Jolivet 46252c4ab24aSJunchao Zhang PetscFunctionBegin; 46262c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->perm)); 46272c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->jmap)); 46282c4ab24aSJunchao Zhang PetscCall(PetscFree(coo)); 46292c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 46302c4ab24aSJunchao Zhang } 46312c4ab24aSJunchao Zhang 4632d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4633d71ae5a4SJacob Faibussowitsch { 4634394ed5ebSJunchao Zhang MPI_Comm comm; 4635394ed5ebSJunchao Zhang PetscInt *i, *j; 46360d88f7f4SJunchao Zhang PetscInt M, N, row, iprev; 4637394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4638394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4639394ed5ebSJunchao Zhang PetscInt *Aj; 4640394ed5ebSJunchao Zhang PetscScalar *Aa; 4641f4f49eeaSPierre Jolivet Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)mat->data; 
4642cbc6b225SStefano Zampini MatType rtype; 4643394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 46442c4ab24aSJunchao Zhang PetscContainer container; 46452c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 46460d88f7f4SJunchao Zhang PetscBool isorted; 46479f0612e4SBarry Smith PetscBool hypre; 46489f0612e4SBarry Smith const char *name; 4649394ed5ebSJunchao Zhang 4650394ed5ebSJunchao Zhang PetscFunctionBegin; 46519566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46529566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4653e8729f6fSJunchao Zhang i = coo_i; 4654e8729f6fSJunchao Zhang j = coo_j; 46559566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 46560d88f7f4SJunchao Zhang 46570d88f7f4SJunchao Zhang /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */ 46580d88f7f4SJunchao Zhang isorted = PETSC_TRUE; 46590d88f7f4SJunchao Zhang iprev = PETSC_INT_MIN; 46600d88f7f4SJunchao Zhang for (k = 0; k < coo_n; k++) { 4661394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 46620d88f7f4SJunchao Zhang if (isorted) { 46630d88f7f4SJunchao Zhang if (i[k] < iprev) isorted = PETSC_FALSE; 46640d88f7f4SJunchao Zhang else iprev = i[k]; 46650d88f7f4SJunchao Zhang } 4666394ed5ebSJunchao Zhang perm[k] = k; 4667394ed5ebSJunchao Zhang } 4668394ed5ebSJunchao Zhang 46690d88f7f4SJunchao Zhang /* Sort by row if not already */ 46700d88f7f4SJunchao Zhang if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 4671651b1cf9SStefano Zampini 4672651b1cf9SStefano Zampini /* Advance k to the first row with a non-negative index */ 4673651b1cf9SStefano Zampini for (k = 0; k < coo_n; k++) 46749371c9d4SSatish Balay if (i[k] >= 0) break; 4675394ed5ebSJunchao Zhang nneg = k; 46769566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. 
jmap[i] originally is the number of repeats for i-th nonzero */ 4677394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 467835cb6cd3SPierre Jolivet jmap++; /* Inc jmap by 1 for convenience */ 4679394ed5ebSJunchao Zhang 46809f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(M + 1, sizeof(PetscInt), (void **)&Ai)); /* CSR of A */ 46819f0612e4SBarry Smith PetscCall(PetscArrayzero(Ai, M + 1)); 46829f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(coo_n - nneg, sizeof(PetscInt), (void **)&Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4683394ed5ebSJunchao Zhang 4684651b1cf9SStefano Zampini PetscCall(PetscObjectGetName((PetscObject)mat, &name)); 4685651b1cf9SStefano Zampini PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre)); 4686651b1cf9SStefano Zampini 4687394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 468835cb6cd3SPierre Jolivet Ai++; /* Inc by 1 for convenience */ 4689394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4690394ed5ebSJunchao Zhang while (k < coo_n) { 46910d88f7f4SJunchao Zhang PetscBool strictly_sorted; // this row is strictly sorted? 
46920d88f7f4SJunchao Zhang PetscInt jprev; 46930d88f7f4SJunchao Zhang 46940d88f7f4SJunchao Zhang /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */ 4695394ed5ebSJunchao Zhang row = i[k]; 46960d88f7f4SJunchao Zhang start = k; 46970d88f7f4SJunchao Zhang jprev = PETSC_INT_MIN; 46980d88f7f4SJunchao Zhang strictly_sorted = PETSC_TRUE; 46990d88f7f4SJunchao Zhang while (k < coo_n && i[k] == row) { 47000d88f7f4SJunchao Zhang if (strictly_sorted) { 47010d88f7f4SJunchao Zhang if (j[k] <= jprev) strictly_sorted = PETSC_FALSE; 47020d88f7f4SJunchao Zhang else jprev = j[k]; 47030d88f7f4SJunchao Zhang } 47040d88f7f4SJunchao Zhang k++; 47050d88f7f4SJunchao Zhang } 4706394ed5ebSJunchao Zhang end = k; 47070d88f7f4SJunchao Zhang 4708651b1cf9SStefano Zampini /* hack for HYPRE: swap min column to diag so that diagonal values will go first */ 4709651b1cf9SStefano Zampini if (hypre) { 4710*1690c2aeSBarry Smith PetscInt minj = PETSC_INT_MAX; 4711651b1cf9SStefano Zampini PetscBool hasdiag = PETSC_FALSE; 47120d88f7f4SJunchao Zhang 47130d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to swap the first and the diag 47140d88f7f4SJunchao Zhang PetscCount tmp; 47150d88f7f4SJunchao Zhang for (p = start; p < end; p++) { 47160d88f7f4SJunchao Zhang if (j[p] == row && p != start) { 47170d88f7f4SJunchao Zhang j[p] = j[start]; 47180d88f7f4SJunchao Zhang j[start] = row; 47190d88f7f4SJunchao Zhang tmp = perm[start]; 47200d88f7f4SJunchao Zhang perm[start] = perm[p]; 47210d88f7f4SJunchao Zhang perm[p] = tmp; 47220d88f7f4SJunchao Zhang break; 47230d88f7f4SJunchao Zhang } 47240d88f7f4SJunchao Zhang } 47250d88f7f4SJunchao Zhang } else { 4726651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4727651b1cf9SStefano Zampini hasdiag = (PetscBool)(hasdiag || (j[p] == row)); 4728651b1cf9SStefano Zampini minj = PetscMin(minj, j[p]); 4729651b1cf9SStefano Zampini } 47300d88f7f4SJunchao Zhang 4731651b1cf9SStefano Zampini if (hasdiag) { 4732651b1cf9SStefano 
Zampini for (p = start; p < end; p++) { 4733651b1cf9SStefano Zampini if (j[p] == minj) j[p] = row; 4734651b1cf9SStefano Zampini else if (j[p] == row) j[p] = minj; 4735651b1cf9SStefano Zampini } 4736651b1cf9SStefano Zampini } 4737651b1cf9SStefano Zampini } 47380d88f7f4SJunchao Zhang } 47390d88f7f4SJunchao Zhang // sort by columns in a row 47400d88f7f4SJunchao Zhang if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4741651b1cf9SStefano Zampini 47420d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q 47430d88f7f4SJunchao Zhang for (p = start; p < end; p++, q++) { 47440d88f7f4SJunchao Zhang Aj[q] = j[p]; 47450d88f7f4SJunchao Zhang jmap[q] = 1; 47460d88f7f4SJunchao Zhang } 47476497c311SBarry Smith PetscCall(PetscIntCast(end - start, Ai + row)); 47480d88f7f4SJunchao Zhang nnz += Ai[row]; // q is already advanced 47490d88f7f4SJunchao Zhang } else { 4750394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4751394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 4752651b1cf9SStefano Zampini jmap[q] = 1; /* Number of repeats of this nonzero entry */ 4753394ed5ebSJunchao Zhang Ai[row] = 1; 4754394ed5ebSJunchao Zhang nnz++; 4755394ed5ebSJunchao Zhang 4756394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4757394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4758394ed5ebSJunchao Zhang q++; 4759394ed5ebSJunchao Zhang jmap[q] = 1; 4760394ed5ebSJunchao Zhang Aj[q] = j[p]; 4761394ed5ebSJunchao Zhang Ai[row]++; 4762394ed5ebSJunchao Zhang nnz++; 4763394ed5ebSJunchao Zhang } else { 4764394ed5ebSJunchao Zhang jmap[q]++; 4765394ed5ebSJunchao Zhang } 4766394ed5ebSJunchao Zhang } 4767394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4768394ed5ebSJunchao Zhang } 47690d88f7f4SJunchao Zhang } 47700d88f7f4SJunchao Zhang 4771394ed5ebSJunchao Zhang Ai--; /* 
Back to the beginning of Ai[] */ 4772394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 47730d88f7f4SJunchao Zhang jmap--; // Back to the beginning of jmap[] 4774394ed5ebSJunchao Zhang jmap[0] = 0; 4775394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 47760d88f7f4SJunchao Zhang 47779f0612e4SBarry Smith if (nnz < coo_n - nneg) { /* Reallocate with actual number of unique nonzeros */ 4778394ed5ebSJunchao Zhang PetscCount *jmap_new; 4779394ed5ebSJunchao Zhang PetscInt *Aj_new; 4780394ed5ebSJunchao Zhang 47819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 47829566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 47839566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4784394ed5ebSJunchao Zhang jmap = jmap_new; 4785394ed5ebSJunchao Zhang 47869f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscInt), (void **)&Aj_new)); 47879566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 47889f0612e4SBarry Smith PetscCall(PetscShmgetDeallocateArray((void **)&Aj)); 4789394ed5ebSJunchao Zhang Aj = Aj_new; 4790394ed5ebSJunchao Zhang } 4791394ed5ebSJunchao Zhang 4792394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4793394ed5ebSJunchao Zhang PetscCount *perm_new; 4794cbc6b225SStefano Zampini 47959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 47969566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 47979566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4798394ed5ebSJunchao Zhang perm = perm_new; 4799394ed5ebSJunchao Zhang } 4800394ed5ebSJunchao Zhang 48019566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 48029f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscScalar), (void **)&Aa)); 48039f0612e4SBarry Smith 
PetscCall(PetscArrayzero(Aa, nnz)); 48049566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4805394ed5ebSJunchao Zhang 4806394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 48072c4ab24aSJunchao Zhang 48082c4ab24aSJunchao Zhang // Put the COO struct in a container and then attach that to the matrix 48092c4ab24aSJunchao Zhang PetscCall(PetscMalloc1(1, &coo)); 48106497c311SBarry Smith PetscCall(PetscIntCast(nnz, &coo->nz)); 48112c4ab24aSJunchao Zhang coo->n = coo_n; 48122c4ab24aSJunchao Zhang coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again 48132c4ab24aSJunchao Zhang coo->jmap = jmap; // of length nnz+1 48142c4ab24aSJunchao Zhang coo->perm = perm; 48152c4ab24aSJunchao Zhang PetscCall(PetscContainerCreate(PETSC_COMM_SELF, &container)); 48162c4ab24aSJunchao Zhang PetscCall(PetscContainerSetPointer(container, coo)); 48172c4ab24aSJunchao Zhang PetscCall(PetscContainerSetUserDestroy(container, MatCOOStructDestroy_SeqAIJ)); 48182c4ab24aSJunchao Zhang PetscCall(PetscObjectCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", (PetscObject)container)); 48192c4ab24aSJunchao Zhang PetscCall(PetscContainerDestroy(&container)); 48203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4821394ed5ebSJunchao Zhang } 4822394ed5ebSJunchao Zhang 4823d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4824d71ae5a4SJacob Faibussowitsch { 4825394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4826394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 48272c4ab24aSJunchao Zhang PetscCount *perm, *jmap; 4828394ed5ebSJunchao Zhang PetscScalar *Aa; 48292c4ab24aSJunchao Zhang PetscContainer container; 48302c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 4831394ed5ebSJunchao Zhang 4832394ed5ebSJunchao Zhang PetscFunctionBegin; 
48332c4ab24aSJunchao Zhang PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container)); 48342c4ab24aSJunchao Zhang PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix"); 48352c4ab24aSJunchao Zhang PetscCall(PetscContainerGetPointer(container, (void **)&coo)); 48362c4ab24aSJunchao Zhang perm = coo->perm; 48372c4ab24aSJunchao Zhang jmap = coo->jmap; 48389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4839394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4840b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4841b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4842b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4843394ed5ebSJunchao Zhang } 48449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 48453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4846394ed5ebSJunchao Zhang } 4847394ed5ebSJunchao Zhang 484834b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48495063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 485002fe1965SBarry Smith #endif 4851d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4852d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *); 4853d5e393b6SSuyash Tandon #endif 48543d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48555063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 48563d0639e7SStefano Zampini #endif 485702fe1965SBarry Smith 4858d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4859d71ae5a4SJacob Faibussowitsch { 4860273d9f13SBarry Smith Mat_SeqAIJ *b; 486138baddfdSBarry Smith PetscMPIInt size; 4862273d9f13SBarry Smith 4863273d9f13SBarry Smith PetscFunctionBegin; 48649566063dSJacob Faibussowitsch 
PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 486508401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4866273d9f13SBarry Smith 48674dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 48682205254eSKarl Rupp 4869b0a32e0cSBarry Smith B->data = (void *)b; 4870aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 4871071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 48722205254eSKarl Rupp 4873f4259b30SLisandro Dalcin b->row = NULL; 4874f4259b30SLisandro Dalcin b->col = NULL; 4875f4259b30SLisandro Dalcin b->icol = NULL; 4876b810aeb4SBarry Smith b->reallocs = 0; 487736db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4878f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4879416022c9SBarry Smith b->nonew = 0; 4880f4259b30SLisandro Dalcin b->diag = NULL; 4881f4259b30SLisandro Dalcin b->solve_work = NULL; 4882f4259b30SLisandro Dalcin B->spptr = NULL; 4883f4259b30SLisandro Dalcin b->saved_values = NULL; 4884f4259b30SLisandro Dalcin b->idiag = NULL; 4885f4259b30SLisandro Dalcin b->mdiag = NULL; 4886f4259b30SLisandro Dalcin b->ssor_work = NULL; 488771f1c65dSBarry Smith b->omega = 1.0; 488871f1c65dSBarry Smith b->fshift = 0.0; 488971f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4890bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4891a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 489217ab2063SBarry Smith 48939566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4894d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 48959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 48969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4897b3866ffcSBarry Smith #endif 48989566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 48999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 49009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 49019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 49029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 49039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 49049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 49059779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 49069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4907191b95cbSRichard Tran Mills #endif 490834b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 49099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 49109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49119566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 491202fe1965SBarry Smith #endif 4913d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4914d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, 
"MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 4915d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 4916d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ)); 4917d5e393b6SSuyash Tandon #endif 49183d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 49199566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 49203d0639e7SStefano Zampini #endif 49219566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4922af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 49239566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4924af8000cdSHong Zhang #endif 4925d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 49269566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4927d24d4204SJose E. 
Roman #endif 492863c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 49299566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 49309566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 493163c07aadSStefano Zampini #endif 49329566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 49339566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 49349566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 49359566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 493614e4dea2SJose E. 
Roman PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ)); 49379566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 49389566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 49399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 49409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 49419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 49429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 49439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 49459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 49469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 49479566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 49489566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 49499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 49503ba16761SJacob 
Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 495117ab2063SBarry Smith } 495217ab2063SBarry Smith 4953b24902e0SBarry Smith /* 49543893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4955b24902e0SBarry Smith */ 4956d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4957d71ae5a4SJacob Faibussowitsch { 49582a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4959071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 496017ab2063SBarry Smith 49613a40ed3dSBarry Smith PetscFunctionBegin; 4962aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4963273d9f13SBarry Smith 4964d5f3da31SBarry Smith C->factortype = A->factortype; 4965f4259b30SLisandro Dalcin c->row = NULL; 4966f4259b30SLisandro Dalcin c->col = NULL; 4967f4259b30SLisandro Dalcin c->icol = NULL; 49686ad4291fSHong Zhang c->reallocs = 0; 4969bc43efbbSJunchao Zhang c->diagonaldense = a->diagonaldense; 497017ab2063SBarry Smith 497169272f91SPierre Jolivet C->assembled = A->assembled; 497217ab2063SBarry Smith 497369272f91SPierre Jolivet if (A->preallocated) { 49749566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 49759566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4976eec197d1SBarry Smith 497731fe6a7dSBarry Smith if (!A->hash_active) { 49789566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 49799566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 49809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 49819566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 498217ab2063SBarry Smith 498317ab2063SBarry Smith /* allocate the matrix space */ 
4984f77e22a1SHong Zhang if (mallocmatspace) { 49859f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscScalar), (void **)&c->a)); 49869f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscInt), (void **)&c->j)); 49879f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(m + 1, sizeof(PetscInt), (void **)&c->i)); 49889566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 49899f0612e4SBarry Smith c->free_a = PETSC_TRUE; 49909f0612e4SBarry Smith c->free_ij = PETSC_TRUE; 499117ab2063SBarry Smith if (m > 0) { 49929566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4993be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 49942e5835c6SStefano Zampini const PetscScalar *aa; 49952e5835c6SStefano Zampini 49969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 49979566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 49989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 4999be6bf707SBarry Smith } else { 50009566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 500117ab2063SBarry Smith } 500208480c60SBarry Smith } 5003f77e22a1SHong Zhang } 500431fe6a7dSBarry Smith C->preallocated = PETSC_TRUE; 500531fe6a7dSBarry Smith } else { 500631fe6a7dSBarry Smith PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix"); 500731fe6a7dSBarry Smith PetscCall(MatSetUp(C)); 500831fe6a7dSBarry Smith } 500917ab2063SBarry Smith 50106ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 5011416022c9SBarry Smith c->roworiented = a->roworiented; 5012416022c9SBarry Smith c->nonew = a->nonew; 5013416022c9SBarry Smith if (a->diag) { 50149566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 50159566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 5016071fcb05SBarry Smith } 
else c->diag = NULL; 50172205254eSKarl Rupp 5018f4259b30SLisandro Dalcin c->solve_work = NULL; 5019f4259b30SLisandro Dalcin c->saved_values = NULL; 5020f4259b30SLisandro Dalcin c->idiag = NULL; 5021f4259b30SLisandro Dalcin c->ssor_work = NULL; 5022a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 50236ad4291fSHong Zhang 5024893ad86cSHong Zhang c->rmax = a->rmax; 5025416022c9SBarry Smith c->nz = a->nz; 50268ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 5027754ec7b1SSatish Balay 50286ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 50296ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 5030cd6b891eSBarry Smith if (a->compressedrow.use) { 50316ad4291fSHong Zhang i = a->compressedrow.nrows; 50329566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 50339566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 50349566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 503527ea64f8SHong Zhang } else { 503627ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 50370298fd71SBarry Smith c->compressedrow.i = NULL; 50380298fd71SBarry Smith c->compressedrow.rindex = NULL; 50396ad4291fSHong Zhang } 5040ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 5041e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 50424846f1f5SKris Buschelman 50439566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 504469272f91SPierre Jolivet } 50459566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 50463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 504717ab2063SBarry Smith } 504817ab2063SBarry Smith 5049d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 
5050d71ae5a4SJacob Faibussowitsch { 5051b24902e0SBarry Smith PetscFunctionBegin; 50529566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 50539566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 505448a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 50559566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 50569566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 50573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5058b24902e0SBarry Smith } 5059b24902e0SBarry Smith 5060d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 5061d71ae5a4SJacob Faibussowitsch { 506252f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 506352f91c60SVaclav Hapla 506452f91c60SVaclav Hapla PetscFunctionBegin; 506552f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 506652f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 5067c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 50689566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 50699566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 50709566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 507152f91c60SVaclav Hapla if (isbinary) { 50729566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 507352f91c60SVaclav Hapla } else if (ishdf5) { 507452f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 50759566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 507652f91c60SVaclav Hapla #else 507752f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not 
supported in this build.\nPlease reconfigure using --download-hdf5"); 507852f91c60SVaclav Hapla #endif 507952f91c60SVaclav Hapla } else { 508098921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 508152f91c60SVaclav Hapla } 50823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 508352f91c60SVaclav Hapla } 508452f91c60SVaclav Hapla 5085d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 5086d71ae5a4SJacob Faibussowitsch { 50873ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 50883ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 5089fbdbba38SShri Abhyankar 5090fbdbba38SShri Abhyankar PetscFunctionBegin; 50919566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5092bbead8a2SBarry Smith 50933ea6fe3dSLisandro Dalcin /* read in matrix header */ 50949566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 509508401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 50969371c9d4SSatish Balay M = header[1]; 50979371c9d4SSatish Balay N = header[2]; 50989371c9d4SSatish Balay nz = header[3]; 509908401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 510008401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 510108401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 5102fbdbba38SShri Abhyankar 51033ea6fe3dSLisandro Dalcin /* set block sizes 
from the viewer's .info file */ 51049566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 51053ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 51063ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 51073ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 51083ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 51093ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 51109566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 51119566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 51123ea6fe3dSLisandro Dalcin 51133ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 51149566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5115aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51163ea6fe3dSLisandro Dalcin 5117fbdbba38SShri Abhyankar /* read in row lengths */ 51189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 51199566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 51203ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 51219371c9d4SSatish Balay sum = 0; 51229371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 512308401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 51243ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 51259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 51269566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5127aed4548fSBarry Smith PetscCheck(M == rows && N == cols, 
PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51283ea6fe3dSLisandro Dalcin /* store row lengths */ 51299566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 51309566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5131fbdbba38SShri Abhyankar 51323ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 51339371c9d4SSatish Balay a->i[0] = 0; 51349371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 51353ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 51369566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 51373ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 51389566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5139fbdbba38SShri Abhyankar 51409566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 51419566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 51423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5143fbdbba38SShri Abhyankar } 5144fbdbba38SShri Abhyankar 5145d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5146d71ae5a4SJacob Faibussowitsch { 51477264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5148fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5149eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5150eeffb40dSHong Zhang PetscInt k; 5151eeffb40dSHong Zhang #endif 51527264ac53SSatish Balay 51533a40ed3dSBarry Smith PetscFunctionBegin; 5154bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5155d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5156ca44d042SBarry Smith *flg = PETSC_FALSE; 
51573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5158bcd2baecSBarry Smith } 51597264ac53SSatish Balay 51607264ac53SSatish Balay /* if the a->i are the same */ 51619566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 51623ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 51637264ac53SSatish Balay 51647264ac53SSatish Balay /* if a->j are the same */ 51659566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 51663ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 5167bcd2baecSBarry Smith 51689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 51699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5170bcd2baecSBarry Smith /* if a->a are the same */ 5171eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5172eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5173fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5174eeffb40dSHong Zhang *flg = PETSC_FALSE; 51753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5176eeffb40dSHong Zhang } 5177eeffb40dSHong Zhang } 5178eeffb40dSHong Zhang #else 51799566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5180eeffb40dSHong Zhang #endif 51819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 51829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 51833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51847264ac53SSatish Balay } 518536db0b34SBarry Smith 518605869f15SSatish Balay /*@ 518711a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 518836db0b34SBarry Smith provided by the user. 
518936db0b34SBarry Smith 5190d083f849SBarry Smith Collective 519136db0b34SBarry Smith 519236db0b34SBarry Smith Input Parameters: 519336db0b34SBarry Smith + comm - must be an MPI communicator of size 1 519436db0b34SBarry Smith . m - number of rows 519536db0b34SBarry Smith . n - number of columns 5196483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 519736db0b34SBarry Smith . j - column indices 519836db0b34SBarry Smith - a - matrix values 519936db0b34SBarry Smith 520036db0b34SBarry Smith Output Parameter: 520136db0b34SBarry Smith . mat - the matrix 520236db0b34SBarry Smith 520336db0b34SBarry Smith Level: intermediate 520436db0b34SBarry Smith 520536db0b34SBarry Smith Notes: 52062ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 5207292fb18eSBarry Smith once the matrix is destroyed and not before 520836db0b34SBarry Smith 520936db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 521036db0b34SBarry Smith 52112ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 521236db0b34SBarry Smith 5213a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5214a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 52158eef79e4SBarry Smith as shown 52162ef1f0ffSBarry Smith .vb 52172ef1f0ffSBarry Smith 1 0 0 52182ef1f0ffSBarry Smith 2 0 3 52192ef1f0ffSBarry Smith 4 5 6 5220a4552177SSatish Balay 52212ef1f0ffSBarry Smith i = {0,1,3,6} [size = nrow+1 = 3+1] 52222ef1f0ffSBarry Smith j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 52232ef1f0ffSBarry Smith v = {1,2,3,4,5,6} [size = 6] 52242ef1f0ffSBarry Smith .ve 5225a4552177SSatish Balay 52261cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 522736db0b34SBarry Smith @*/ 5228d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5229d71ae5a4SJacob Faibussowitsch { 5230cbcfb4deSHong Zhang PetscInt ii; 523136db0b34SBarry Smith Mat_SeqAIJ *aij; 5232cbcfb4deSHong Zhang PetscInt jj; 523336db0b34SBarry Smith 523436db0b34SBarry Smith PetscFunctionBegin; 5235aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 52369566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52379566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52389566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 52399566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5241ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 52429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 52439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5244ab93d7beSBarry Smith 524536db0b34SBarry Smith aij->i = i; 524636db0b34SBarry Smith aij->j = j; 524736db0b34SBarry Smith aij->a = a; 
524836db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5249e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5250e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 525136db0b34SBarry Smith 5252cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 525336db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 525476bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5255aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 52569985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 525708401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 525808401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 52599985e31cSBarry Smith } 526036db0b34SBarry Smith } 526176bd3646SJed Brown } 526276bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 526336db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 526408401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5265da0802e2SStefano Zampini PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1); 526636db0b34SBarry Smith } 526776bd3646SJed Brown } 526836db0b34SBarry Smith 52699566063dSJacob 
Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52709566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 527236db0b34SBarry Smith } 5273cbc6b225SStefano Zampini 5274f62e3866SBarry Smith /*@ 527511a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 52768a0b0e6bSVictor Minden provided by the user. 52778a0b0e6bSVictor Minden 5278d083f849SBarry Smith Collective 52798a0b0e6bSVictor Minden 52808a0b0e6bSVictor Minden Input Parameters: 52818a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 52828a0b0e6bSVictor Minden . m - number of rows 52838a0b0e6bSVictor Minden . n - number of columns 52848a0b0e6bSVictor Minden . i - row indices 52858a0b0e6bSVictor Minden . j - column indices 52861230e6d1SVictor Minden . a - matrix values 52871230e6d1SVictor Minden . nz - number of nonzeros 52882ef1f0ffSBarry Smith - idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 52898a0b0e6bSVictor Minden 52908a0b0e6bSVictor Minden Output Parameter: 52918a0b0e6bSVictor Minden . 
mat - the matrix 52928a0b0e6bSVictor Minden 52938a0b0e6bSVictor Minden Level: intermediate 52948a0b0e6bSVictor Minden 5295f62e3866SBarry Smith Example: 5296f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 52979e99939fSJunchao Zhang .vb 52988a0b0e6bSVictor Minden 1 0 0 52998a0b0e6bSVictor Minden 2 0 3 53008a0b0e6bSVictor Minden 4 5 6 53018a0b0e6bSVictor Minden 53028a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 53038a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 53048a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 53059e99939fSJunchao Zhang .ve 5306fe59aa6dSJacob Faibussowitsch 53072ef1f0ffSBarry Smith Note: 5308d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5309d7547e51SJunchao Zhang and are particularly useful in iterative applications. 53108a0b0e6bSVictor Minden 53111cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 53128a0b0e6bSVictor Minden @*/ 5313d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5314d71ae5a4SJacob Faibussowitsch { 5315d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 53168a0b0e6bSVictor Minden 53178a0b0e6bSVictor Minden PetscFunctionBegin; 53189566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5319ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 53209566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 53219566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 53229566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 53239566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 53241230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 53251230e6d1SVictor Minden if (idx) { 53261230e6d1SVictor Minden row = i[ii] - 1; 53271230e6d1SVictor Minden col = j[ii] - 1; 53281230e6d1SVictor Minden } else { 53291230e6d1SVictor Minden row = i[ii]; 53301230e6d1SVictor Minden col = j[ii]; 53318a0b0e6bSVictor Minden } 53329566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 53338a0b0e6bSVictor Minden } 53349566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 53359566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 53369566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 53373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53388a0b0e6bSVictor Minden } 533936db0b34SBarry Smith 5340d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5341d71ae5a4SJacob Faibussowitsch { 5342acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5343acf2f550SJed Brown 5344acf2f550SJed Brown PetscFunctionBegin; 5345acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5346acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 53472205254eSKarl Rupp 53489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 53493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5350acf2f550SJed Brown } 5351acf2f550SJed Brown 5352d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5353d71ae5a4SJacob Faibussowitsch { 53549c8f2541SHong Zhang PetscFunctionBegin; 53559566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 53563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53579c8f2541SHong Zhang } 53589c8f2541SHong Zhang 535981824310SBarry Smith /* 536053dd7562SDmitry Karpeev Permute A 
into C's *local* index space using rowemb,colemb. 536153dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 536253dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 536353dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 536453dd7562SDmitry Karpeev */ 5365d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5366d71ae5a4SJacob Faibussowitsch { 536753dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 536853dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 536953dd7562SDmitry Karpeev PetscBool seqaij; 537053dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 537153dd7562SDmitry Karpeev PetscScalar v; 537253dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 537353dd7562SDmitry Karpeev 537453dd7562SDmitry Karpeev PetscFunctionBegin; 53753ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 537653dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 53779566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 537828b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 537953dd7562SDmitry Karpeev if (rowemb) { 53809566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 538108401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 538253dd7562SDmitry Karpeev } else { 538308401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 538453dd7562SDmitry Karpeev } 538553dd7562SDmitry Karpeev if (colemb) { 53869566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 538708401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 538853dd7562SDmitry Karpeev } else { 538908401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 539053dd7562SDmitry Karpeev } 539153dd7562SDmitry Karpeev 5392f4f49eeaSPierre Jolivet Baij = (Mat_SeqAIJ *)B->data; 539353dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 53949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5395ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 53969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 53979566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 539853dd7562SDmitry Karpeev } 539948a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 540053dd7562SDmitry Karpeev count = 0; 540153dd7562SDmitry Karpeev rowindices = NULL; 
540253dd7562SDmitry Karpeev colindices = NULL; 540348a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 540448a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 540553dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 540653dd7562SDmitry Karpeev PetscInt row; 540753dd7562SDmitry Karpeev row = i; 540853dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 540953dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 541053dd7562SDmitry Karpeev PetscInt col; 541153dd7562SDmitry Karpeev col = Baij->j[count]; 541253dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 541353dd7562SDmitry Karpeev v = Baij->a[count]; 54149566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 541553dd7562SDmitry Karpeev ++count; 541653dd7562SDmitry Karpeev } 541753dd7562SDmitry Karpeev } 541853dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 541953dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 542053dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 542153dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 542253dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 54233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 542453dd7562SDmitry Karpeev } 542553dd7562SDmitry Karpeev 542658c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep) 5427dec0b466SHong Zhang { 5428dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5429dec0b466SHong Zhang MatScalar *aa = a->a; 5430dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5431dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5432dec0b466SHong Zhang 5433dec0b466SHong Zhang PetscFunctionBegin; 5434dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5435dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5436dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5437dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5438dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 543958c11ad4SPierre Jolivet if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++; 5440dec0b466SHong Zhang else { 5441dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5442dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5443dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5444dec0b466SHong Zhang } 5445dec0b466SHong Zhang } 5446dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5447dec0b466SHong Zhang fshift_prev = fshift; 5448dec0b466SHong Zhang /* reset ilen and imax for each row */ 5449dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5450dec0b466SHong Zhang a->nonzerorowcnt += 
((ai[i] - fshift - ai[i - 1]) > 0); 5451dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5452dec0b466SHong Zhang } 5453312eded4SPierre Jolivet if (fshift) { 5454dec0b466SHong Zhang if (m) { 5455dec0b466SHong Zhang ai[m] -= fshift; 5456dec0b466SHong Zhang a->nz = ai[m]; 5457dec0b466SHong Zhang } 5458dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5459312eded4SPierre Jolivet A->nonzerostate++; 5460dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5461dec0b466SHong Zhang a->rmax = rmax; 5462dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5463dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5464dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5465312eded4SPierre Jolivet } 54663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5467dec0b466SHong Zhang } 5468dec0b466SHong Zhang 54694099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 54704099cc6bSBarry Smith 5471cc4c1da9SBarry Smith /*@ 547211a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 54734099cc6bSBarry Smith 5474c3339decSBarry Smith Collective 54754099cc6bSBarry Smith 54764099cc6bSBarry Smith Input Parameters: 54774099cc6bSBarry Smith + mat - the matrix object 54784099cc6bSBarry Smith - matype - matrix type 54794099cc6bSBarry Smith 54804099cc6bSBarry Smith Options Database Key: 54814e187271SRichard Tran Mills . 
-mat_seqaij_type <method> - for example seqaijcrl 54824099cc6bSBarry Smith 54834099cc6bSBarry Smith Level: intermediate 54844099cc6bSBarry Smith 5485fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType` 54864099cc6bSBarry Smith @*/ 5487d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5488d71ae5a4SJacob Faibussowitsch { 54894099cc6bSBarry Smith PetscBool sametype; 54905f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 54914099cc6bSBarry Smith 54924099cc6bSBarry Smith PetscFunctionBegin; 54934099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 54949566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 54953ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 54964099cc6bSBarry Smith 54979566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 54986adde796SStefano Zampini PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 54999566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 55003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55014099cc6bSBarry Smith } 55024099cc6bSBarry Smith 55034099cc6bSBarry Smith /*@C 550411a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 55054099cc6bSBarry Smith 5506cc4c1da9SBarry Smith Not Collective, No Fortran Support 55074099cc6bSBarry Smith 55084099cc6bSBarry Smith Input Parameters: 5509fe59aa6dSJacob Faibussowitsch + sname - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 55104099cc6bSBarry Smith - function - routine to convert to subtype 55114099cc6bSBarry Smith 55122ef1f0ffSBarry Smith Level: advanced 55132ef1f0ffSBarry Smith 55144099cc6bSBarry Smith Notes: 551511a5261eSBarry Smith 
`MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 55164099cc6bSBarry Smith 55174099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 55184099cc6bSBarry Smith $ -mat_seqaij_type my_mat 55194099cc6bSBarry Smith 55201cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()` 55214099cc6bSBarry Smith @*/ 5522d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5523d71ae5a4SJacob Faibussowitsch { 55244099cc6bSBarry Smith PetscFunctionBegin; 55259566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 55269566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 55273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55284099cc6bSBarry Smith } 55294099cc6bSBarry Smith 55304099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 55314099cc6bSBarry Smith 55324099cc6bSBarry Smith /*@C 553311a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 55344099cc6bSBarry Smith 55354099cc6bSBarry Smith Not Collective 55364099cc6bSBarry Smith 55374099cc6bSBarry Smith Level: advanced 55384099cc6bSBarry Smith 55392ef1f0ffSBarry Smith Note: 55402ef1f0ffSBarry Smith This registers the versions of `MATSEQAIJ` for GPUs 55412ef1f0ffSBarry Smith 55421cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()` 55434099cc6bSBarry Smith @*/ 5544d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5545d71ae5a4SJacob Faibussowitsch { 55464099cc6bSBarry Smith PetscFunctionBegin; 55473ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 55484099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 55494099cc6bSBarry Smith 55509566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 55519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 55529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 55539779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 55549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5555485f9817SRichard Tran Mills #endif 55565063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 55579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 55585063d097SStefano Zampini #endif 5559d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5560d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5561d5e393b6SSuyash Tandon #endif 55625063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 55639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 55645063d097SStefano Zampini #endif 55654099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 55669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 55674099cc6bSBarry Smith #endif 55683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55694099cc6bSBarry Smith } 557053dd7562SDmitry Karpeev 557153dd7562SDmitry Karpeev /* 557281824310SBarry Smith Special version for direct calls from Fortran 557381824310SBarry Smith */ 557481824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 557581824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 557681824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 557781824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 557881824310SBarry Smith #endif 557981824310SBarry Smith 558081824310SBarry Smith /* Change 
these macros so can be used in void function */ 558198921bdaSJacob Faibussowitsch 558298921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 55839566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 55849566063dSJacob Faibussowitsch #undef PetscCall 55859371c9d4SSatish Balay #define PetscCall(...) \ 55869371c9d4SSatish Balay do { \ 55875f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 558898921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 558998921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 559098921bdaSJacob Faibussowitsch return; \ 559198921bdaSJacob Faibussowitsch } \ 559298921bdaSJacob Faibussowitsch } while (0) 559398921bdaSJacob Faibussowitsch 559498921bdaSJacob Faibussowitsch #undef SETERRQ 55959371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 55969371c9d4SSatish Balay do { \ 559798921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 559898921bdaSJacob Faibussowitsch return; \ 559998921bdaSJacob Faibussowitsch } while (0) 560081824310SBarry Smith 5601d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5602d71ae5a4SJacob Faibussowitsch { 560381824310SBarry Smith Mat A = *AA; 560481824310SBarry Smith PetscInt m = *mm, n = *nn; 560581824310SBarry Smith InsertMode is = *isis; 560681824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 560781824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 560881824310SBarry Smith PetscInt *imax, *ai, *ailen; 560981824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 561054f21887SBarry Smith MatScalar *ap, value, 
*aa; 5611ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5612ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 561381824310SBarry Smith 561481824310SBarry Smith PetscFunctionBegin; 56154994cf47SJed Brown MatCheckPreallocated(A, 1); 561681824310SBarry Smith imax = a->imax; 561781824310SBarry Smith ai = a->i; 561881824310SBarry Smith ailen = a->ilen; 561981824310SBarry Smith aj = a->j; 562081824310SBarry Smith aa = a->a; 562181824310SBarry Smith 562281824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 562381824310SBarry Smith row = im[k]; 562481824310SBarry Smith if (row < 0) continue; 56255f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 56269371c9d4SSatish Balay rp = aj + ai[row]; 56279371c9d4SSatish Balay ap = aa + ai[row]; 56289371c9d4SSatish Balay rmax = imax[row]; 56299371c9d4SSatish Balay nrow = ailen[row]; 563081824310SBarry Smith low = 0; 563181824310SBarry Smith high = nrow; 563281824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 563381824310SBarry Smith if (in[l] < 0) continue; 56345f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 563581824310SBarry Smith col = in[l]; 56362205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 56372205254eSKarl Rupp else value = v[k + l * m]; 56382205254eSKarl Rupp 563981824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 564081824310SBarry Smith 56412205254eSKarl Rupp if (col <= lastcol) low = 0; 56422205254eSKarl Rupp else high = nrow; 564381824310SBarry Smith lastcol = col; 564481824310SBarry Smith while (high - low > 5) { 564581824310SBarry Smith t = (low + high) / 2; 564681824310SBarry Smith if (rp[t] > col) high = t; 564781824310SBarry Smith else low = t; 564881824310SBarry Smith } 564981824310SBarry Smith for (i = low; i < 
high; i++) { 565081824310SBarry Smith if (rp[i] > col) break; 565181824310SBarry Smith if (rp[i] == col) { 565281824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 565381824310SBarry Smith else ap[i] = value; 565481824310SBarry Smith goto noinsert; 565581824310SBarry Smith } 565681824310SBarry Smith } 565781824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 565881824310SBarry Smith if (nonew == 1) goto noinsert; 56595f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5660fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 56619371c9d4SSatish Balay N = nrow++ - 1; 56629371c9d4SSatish Balay a->nz++; 56639371c9d4SSatish Balay high++; 566481824310SBarry Smith /* shift up all the later entries in this row */ 566581824310SBarry Smith for (ii = N; ii >= i; ii--) { 566681824310SBarry Smith rp[ii + 1] = rp[ii]; 566781824310SBarry Smith ap[ii + 1] = ap[ii]; 566881824310SBarry Smith } 566981824310SBarry Smith rp[i] = col; 567081824310SBarry Smith ap[i] = value; 567181824310SBarry Smith noinsert:; 567281824310SBarry Smith low = i + 1; 567381824310SBarry Smith } 567481824310SBarry Smith ailen[row] = nrow; 567581824310SBarry Smith } 567681824310SBarry Smith PetscFunctionReturnVoid(); 567781824310SBarry Smith } 567898921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 567998921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 568098921bdaSJacob Faibussowitsch * original definitions */ 56819566063dSJacob Faibussowitsch #undef PetscCall 568298921bdaSJacob Faibussowitsch #undef SETERRQ 5683