1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 20d71ae5a4SJacob Faibussowitsch { 214099cc6bSBarry Smith PetscBool flg; 224099cc6bSBarry Smith char type[256]; 234099cc6bSBarry Smith 244099cc6bSBarry Smith PetscFunctionBegin; 25d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 279566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 28d0609cedSBarry Smith PetscOptionsEnd(); 293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 304099cc6bSBarry Smith } 314099cc6bSBarry Smith 32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 33d71ae5a4SJacob Faibussowitsch { 340716a85fSBarry Smith PetscInt i, m, n; 350716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 360716a85fSBarry Smith 370716a85fSBarry Smith PetscFunctionBegin; 389566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 400716a85fSBarry Smith if (type == NORM_2) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 420716a85fSBarry Smith } else if (type == NORM_1) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_INFINITY) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 506adde796SStefano Zampini } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 53a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 54857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 560716a85fSBarry Smith } 573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 580716a85fSBarry Smith } 590716a85fSBarry Smith 60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 61d71ae5a4SJacob Faibussowitsch { 623a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 633a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 
643a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 653a062f41SBarry Smith PetscInt *rows; 663a062f41SBarry Smith 673a062f41SBarry Smith PetscFunctionBegin; 683a062f41SBarry Smith for (i = 0; i < m; i++) { 69ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i = 0; i < m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 799566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 84d71ae5a4SJacob Faibussowitsch { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 86fff043a9SJunchao Zhang const MatScalar *aa; 876ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith 916ce1633cSBarry Smith PetscFunctionBegin; 929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 939566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i = 0; i < m; i++) { 96ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 976ce1633cSBarry Smith } 989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 996ce1633cSBarry Smith cnt = 0; 1006ce1633cSBarry 
Smith for (i = 0; i < m; i++) { 101ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1026ce1633cSBarry Smith } 103f1f41ecbSJed Brown *nrows = cnt; 104f1f41ecbSJed Brown *zrows = rows; 1059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107f1f41ecbSJed Brown } 108f1f41ecbSJed Brown 109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 110d71ae5a4SJacob Faibussowitsch { 111f1f41ecbSJed Brown PetscInt nrows, *rows; 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscFunctionBegin; 1140298fd71SBarry Smith *zrows = NULL; 1159566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1169566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1186ce1633cSBarry Smith } 1196ce1633cSBarry Smith 120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 121d71ae5a4SJacob Faibussowitsch { 122b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 123b3a44c85SBarry Smith const MatScalar *aa; 124b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 125b3a44c85SBarry Smith const PetscInt *ii; 126b3a44c85SBarry Smith PetscInt n, i, j, *rows; 127b3a44c85SBarry Smith 128b3a44c85SBarry Smith PetscFunctionBegin; 1299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 130f4259b30SLisandro Dalcin *keptrows = NULL; 131b3a44c85SBarry Smith ii = a->i; 132b3a44c85SBarry Smith for (i = 0; i < m; i++) { 133b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 134b3a44c85SBarry Smith if (!n) { 135b3a44c85SBarry Smith cnt++; 136b3a44c85SBarry Smith goto ok1; 137b3a44c85SBarry Smith } 1382e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 
139b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 140b3a44c85SBarry Smith } 141b3a44c85SBarry Smith cnt++; 142b3a44c85SBarry Smith ok1:; 143b3a44c85SBarry Smith } 1442e5835c6SStefano Zampini if (!cnt) { 1459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1472e5835c6SStefano Zampini } 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 149b3a44c85SBarry Smith cnt = 0; 150b3a44c85SBarry Smith for (i = 0; i < m; i++) { 151b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 152b3a44c85SBarry Smith if (!n) continue; 1532e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 154b3a44c85SBarry Smith if (aa[j] != 0.0) { 155b3a44c85SBarry Smith rows[cnt++] = i; 156b3a44c85SBarry Smith break; 157b3a44c85SBarry Smith } 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 1609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1619566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith 165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 166d71ae5a4SJacob Faibussowitsch { 16779299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172ace3abfcSBarry Smith PetscBool missing; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 1769566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 17709f38230SBarry Smith if (!missing) { 17879299369SBarry Smith diag = aij->diag; 1799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 
1809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 18179299369SBarry Smith if (is == INSERT_VALUES) { 182ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18379299369SBarry Smith } else { 184ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18579299369SBarry Smith } 1869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18979299369SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 19109f38230SBarry Smith } 1929566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19409f38230SBarry Smith } 19579299369SBarry Smith 196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 197d71ae5a4SJacob Faibussowitsch { 198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19997f1f81fSBarry Smith PetscInt i, ishift; 20017ab2063SBarry Smith 2013a40ed3dSBarry Smith PetscFunctionBegin; 202f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2033ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 204bfeeae90SHong Zhang ishift = 0; 205b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2069566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 207bfeeae90SHong Zhang } else if (oshift == 1) { 2081a83f524SJed Brown PetscInt *tia; 209d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2103b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 
2121a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2131a83f524SJed Brown *ia = tia; 214ecc77c7aSBarry Smith if (ja) { 2151a83f524SJed Brown PetscInt *tja; 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob 
Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch 
PetscCall(PetscFree(*ja)); 2813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; 
row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 
379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, 
PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 4188e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 4198e3a54c0SPierre Jolivet if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]); 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != 
col) goto noinsert; 453c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e44c0bd4SBarry Smith noinsert:; 47217ab2063SBarry Smith } 47317ab2063SBarry Smith ailen[row] = nrow; 47417ab2063SBarry Smith } 4759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47717ab2063SBarry Smith } 47817ab2063SBarry Smith 479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 480d71ae5a4SJacob Faibussowitsch { 48119b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48219b08ed1SBarry Smith PetscInt *rp, k, row; 48319b08ed1SBarry Smith PetscInt *ai = a->i; 48419b08ed1SBarry Smith PetscInt *aj = a->j; 485fff043a9SJunchao Zhang 
MatScalar *aa, *ap; 48619b08ed1SBarry Smith 48719b08ed1SBarry Smith PetscFunctionBegin; 48828b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48908401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 490fff043a9SJunchao Zhang 4919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49219b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49319b08ed1SBarry Smith row = im[k]; 49419b08ed1SBarry Smith rp = aj + ai[row]; 4958e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 49619b08ed1SBarry Smith 4979566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49819b08ed1SBarry Smith if (!A->structure_only) { 49919b08ed1SBarry Smith if (v) { 5009566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 50119b08ed1SBarry Smith v += n; 50219b08ed1SBarry Smith } else { 5039566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50419b08ed1SBarry Smith } 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith a->ilen[row] = n; 50719b08ed1SBarry Smith a->imax[row] = n; 50819b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50919b08ed1SBarry Smith a->nz += n; 51019b08ed1SBarry Smith } 5119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51319b08ed1SBarry Smith } 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith /*@ 51619b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 
51719b08ed1SBarry Smith 51819b08ed1SBarry Smith Input Parameters: 51911a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52119b08ed1SBarry Smith 52219b08ed1SBarry Smith Level: advanced 52319b08ed1SBarry Smith 52419b08ed1SBarry Smith Notes: 52519b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52611a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52719b08ed1SBarry Smith as always with multiple matrix assemblies. 52819b08ed1SBarry Smith 5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53019b08ed1SBarry Smith @*/ 531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 532d71ae5a4SJacob Faibussowitsch { 53319b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53419b08ed1SBarry Smith 53519b08ed1SBarry Smith PetscFunctionBegin; 5369566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53819b08ed1SBarry Smith a->maxnz = nztotal; 5394dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 54019b08ed1SBarry Smith if (!a->ilen) { 5419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54219b08ed1SBarry Smith } else { 5439566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54419b08ed1SBarry Smith } 54519b08ed1SBarry Smith 54619b08ed1SBarry Smith /* allocate the matrix space */ 5479f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(A->rmap->n + 1, sizeof(PetscInt), (void **)&a->i)); 5489f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscInt), (void **)&a->j)); 
5499f0612e4SBarry Smith a->free_ij = PETSC_TRUE; 55019b08ed1SBarry Smith if (A->structure_only) { 55119b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55219b08ed1SBarry Smith } else { 5539f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscScalar), (void **)&a->a)); 55419b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55519b08ed1SBarry Smith } 5569f0612e4SBarry Smith a->i[0] = 0; 55719b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55819b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56019b08ed1SBarry Smith } 56119b08ed1SBarry Smith 562ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 563d71ae5a4SJacob Faibussowitsch { 564071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 565071fcb05SBarry Smith PetscInt *rp, k, row; 566071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 567071fcb05SBarry Smith PetscInt *aj = a->j; 568fff043a9SJunchao Zhang MatScalar *aa, *ap; 569071fcb05SBarry Smith 570071fcb05SBarry Smith PetscFunctionBegin; 5719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 572071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 573071fcb05SBarry Smith row = im[k]; 5746bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 575071fcb05SBarry Smith rp = aj + ai[row]; 576071fcb05SBarry Smith ap = aa + ai[row]; 57748a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 578071fcb05SBarry Smith if (!A->structure_only) { 579071fcb05SBarry Smith if (v) { 5809566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 581071fcb05SBarry Smith v += n; 
582071fcb05SBarry Smith } else { 5839566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 584071fcb05SBarry Smith } 585071fcb05SBarry Smith } 586071fcb05SBarry Smith ailen[row] = n; 587071fcb05SBarry Smith a->nz += n; 588071fcb05SBarry Smith } 5899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 591071fcb05SBarry Smith } 592071fcb05SBarry Smith 593ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 594d71ae5a4SJacob Faibussowitsch { 5957eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59697f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59797f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 5984e208921SJed Brown const MatScalar *ap, *aa; 5997eb43aa7SLois Curfman McInnes 6003a40ed3dSBarry Smith PetscFunctionBegin; 6014e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6027eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6037eb43aa7SLois Curfman McInnes row = im[k]; 6049371c9d4SSatish Balay if (row < 0) { 6059371c9d4SSatish Balay v += n; 6069371c9d4SSatish Balay continue; 6079371c9d4SSatish Balay } /* negative row */ 60854c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6098e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 6108e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 6117eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6127eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6139371c9d4SSatish Balay if (in[l] < 0) { 6149371c9d4SSatish Balay v++; 6159371c9d4SSatish Balay continue; 6169371c9d4SSatish Balay } /* negative column */ 
61754c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 618bfeeae90SHong Zhang col = in[l]; 6199371c9d4SSatish Balay high = nrow; 6209371c9d4SSatish Balay low = 0; /* assume unsorted */ 6217eb43aa7SLois Curfman McInnes while (high - low > 5) { 6227eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6237eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6247eb43aa7SLois Curfman McInnes else low = t; 6257eb43aa7SLois Curfman McInnes } 6267eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6277eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6287eb43aa7SLois Curfman McInnes if (rp[i] == col) { 629b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6307eb43aa7SLois Curfman McInnes goto finished; 6317eb43aa7SLois Curfman McInnes } 6327eb43aa7SLois Curfman McInnes } 63397e567efSBarry Smith *v++ = 0.0; 6347eb43aa7SLois Curfman McInnes finished:; 6357eb43aa7SLois Curfman McInnes } 6367eb43aa7SLois Curfman McInnes } 6374e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6397eb43aa7SLois Curfman McInnes } 6407eb43aa7SLois Curfman McInnes 641ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 642d71ae5a4SJacob Faibussowitsch { 6433ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 644c898d852SStefano Zampini const PetscScalar *av; 6453ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6463ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64717ab2063SBarry Smith 6483a40ed3dSBarry Smith PetscFunctionBegin; 6499566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6502205254eSKarl Rupp 6513ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6523ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6533ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6543ea6fe3dSLisandro Dalcin nz = A->nz; 655416022c9SBarry 
Smith 6563ea6fe3dSLisandro Dalcin /* write matrix header */ 6573ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6589371c9d4SSatish Balay header[1] = M; 6599371c9d4SSatish Balay header[2] = N; 6609371c9d4SSatish Balay header[3] = nz; 6619566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 662416022c9SBarry Smith 6633ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6653ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 666e457bb90SBarry Smith if (PetscDefined(USE_DEBUG)) { 667e457bb90SBarry Smith PetscInt mnz = 0; 668e457bb90SBarry Smith 669e457bb90SBarry Smith for (i = 0; i < m; i++) mnz += rowlens[i]; 670e457bb90SBarry Smith PetscCheck(nz == mnz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row lens %" PetscInt_FMT " do not sum to nz %" PetscInt_FMT, mnz, nz); 671e457bb90SBarry Smith } 6729566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6739566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6743ea6fe3dSLisandro Dalcin /* store column indices */ 6759566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 676416022c9SBarry Smith /* store nonzero values */ 6779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6789566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 680b37d52dbSMark F. 
Adams 6813ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6829566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 68417ab2063SBarry Smith } 685416022c9SBarry Smith 686d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 687d71ae5a4SJacob Faibussowitsch { 6887dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6897dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6907dc0baabSHong Zhang 6917dc0baabSHong Zhang PetscFunctionBegin; 6929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6937dc0baabSHong Zhang for (i = 0; i < m; i++) { 6949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 69548a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6977dc0baabSHong Zhang } 6989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7007dc0baabSHong Zhang } 7017dc0baabSHong Zhang 70209573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 703cd155464SBarry Smith 704ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 705d71ae5a4SJacob Faibussowitsch { 706416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 707c898d852SStefano Zampini const PetscScalar *av; 70860e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 709e060cb09SBarry Smith const char *name; 710f3ef73ceSBarry Smith PetscViewerFormat format; 71117ab2063SBarry Smith 7123a40ed3dSBarry Smith PetscFunctionBegin; 7137dc0baabSHong Zhang if (A->structure_only) { 7149566063dSJacob Faibussowitsch 
PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7167dc0baabSHong Zhang } 71743e49210SHong Zhang 7189566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 719bd6a2ce3SJunchao Zhang // By petsc's rule, even PETSC_VIEWER_ASCII_INFO_DETAIL doesn't print matrix entries 7203ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 7212e5835c6SStefano Zampini 722c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 72571c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 72697f1f81fSBarry Smith PetscInt nofinalvalue = 0; 72760e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 728c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 729d00d2cf4SBarry Smith nofinalvalue = 1; 730d00d2cf4SBarry Smith } 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 734fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 736fbfe6fa7SJed Brown #else 7379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 738fbfe6fa7SJed Brown #endif 7399566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 74017ab2063SBarry Smith 74117ab2063SBarry Smith for (i = 0; i < m; i++) { 74260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 743aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 74517ab2063SBarry Smith #else 7469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 74717ab2063SBarry Smith #endif 74817ab2063SBarry Smith } 74917ab2063SBarry Smith } 750d00d2cf4SBarry Smith if (nofinalvalue) { 751c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 753c337ccceSJed Brown #else 7549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 755c337ccceSJed Brown #endif 756d00d2cf4SBarry Smith } 7579566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 760fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 76244cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 76460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 765aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76836db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 77036db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7726831982aSBarry Smith } 77344cd7ae7SLois Curfman McInnes #else 7749566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 77544cd7ae7SLois Curfman McInnes #endif 77644cd7ae7SLois Curfman McInnes } 7779566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77844cd7ae7SLois 
Curfman McInnes } 7799566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 780fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 78197f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7839566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 784496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 785496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 78660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 787496be53dSLois Curfman McInnes if (a->j[j] >= i) { 788aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78936db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 790496be53dSLois Curfman McInnes #else 791496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 792496be53dSLois Curfman McInnes #endif 793496be53dSLois Curfman McInnes } 794496be53dSLois Curfman McInnes } 795496be53dSLois Curfman McInnes } 7962e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7982e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7992205254eSKarl Rupp if (i + 4 < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 8012205254eSKarl Rupp } else if (i + 3 < m) { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 8032205254eSKarl Rupp } else if (i + 2 < m) { 8049566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 8052205254eSKarl Rupp } else if (i + 1 < m) { 8069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 8072205254eSKarl Rupp } else if (i < m) { 8089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8092205254eSKarl Rupp } else { 8109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8112205254eSKarl Rupp } 812496be53dSLois Curfman McInnes } 8139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8149566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 815496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8179566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 818496be53dSLois Curfman McInnes } 8199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 820496be53dSLois Curfman McInnes } 8219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 822496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 82360e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 824496be53dSLois Curfman McInnes if (a->j[j] >= i) { 825aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 82648a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 827496be53dSLois Curfman McInnes #else 8289566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
829496be53dSLois Curfman McInnes #endif 830496be53dSLois Curfman McInnes } 831496be53dSLois Curfman McInnes } 8329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 833496be53dSLois Curfman McInnes } 8349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 835fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 83697f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 83787828ca2SBarry Smith PetscScalar value; 83868f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83968f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 84068f1ed48SBarry Smith 84168f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 84268f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 84368f1ed48SBarry Smith realonly = PETSC_FALSE; 84468f1ed48SBarry Smith break; 84568f1ed48SBarry Smith } 84668f1ed48SBarry Smith } 84768f1ed48SBarry Smith #endif 84802594712SBarry Smith 8499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 85002594712SBarry Smith for (i = 0; i < m; i++) { 85102594712SBarry Smith jcnt = 0; 852d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 853e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 85402594712SBarry Smith value = a->a[cnt++]; 855e24b481bSBarry Smith jcnt++; 85602594712SBarry Smith } else { 85702594712SBarry Smith value = 0.0; 85802594712SBarry Smith } 859aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 86068f1ed48SBarry Smith if (realonly) { 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 86268f1ed48SBarry Smith } else { 8639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 86468f1ed48SBarry Smith } 86502594712SBarry Smith #else 8669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 86702594712SBarry Smith 
#endif 86802594712SBarry Smith } 8699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 87002594712SBarry Smith } 8719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8723c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 873150b93efSMatthew G. Knepley PetscInt fshift = 1; 8749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8773c215bfdSMatthew Knepley #else 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8793c215bfdSMatthew Knepley #endif 8809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8813c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 88260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8833c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8853c215bfdSMatthew Knepley #else 8869566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8873c215bfdSMatthew Knepley #endif 8883c215bfdSMatthew Knepley } 8893c215bfdSMatthew Knepley } 8909566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8913a40ed3dSBarry Smith } else { 8929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 893d5f3da31SBarry Smith if (A->factortype) { 89416cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 89616cd7e1dSShri Abhyankar /* L part */ 89760e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 90116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 90316cd7e1dSShri Abhyankar } else { 9049566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 90516cd7e1dSShri Abhyankar } 90616cd7e1dSShri Abhyankar #else 9079566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90816cd7e1dSShri Abhyankar #endif 90916cd7e1dSShri Abhyankar } 91016cd7e1dSShri Abhyankar /* diagonal */ 91116cd7e1dSShri Abhyankar j = a->diag[i]; 91216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91316cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 914835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)PetscImaginaryPart(1 / a->a[j]))); 91516cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 916835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)(-PetscImaginaryPart(1 / a->a[j])))); 91716cd7e1dSShri Abhyankar } else { 918835f2295SStefano Zampini 
PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1 / a->a[j]))); 91916cd7e1dSShri Abhyankar } 92016cd7e1dSShri Abhyankar #else 921835f2295SStefano Zampini PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1 / a->a[j]))); 92216cd7e1dSShri Abhyankar #endif 92316cd7e1dSShri Abhyankar 92416cd7e1dSShri Abhyankar /* U part */ 92560e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 92616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 92716cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9289566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92916cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 93116cd7e1dSShri Abhyankar } else { 9329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 93316cd7e1dSShri Abhyankar } 93416cd7e1dSShri Abhyankar #else 9359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 93616cd7e1dSShri Abhyankar #endif 93716cd7e1dSShri Abhyankar } 9389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93916cd7e1dSShri Abhyankar } 94016cd7e1dSShri Abhyankar } else { 94117ab2063SBarry Smith for (i = 0; i < m; i++) { 9429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 94360e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 944aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 94536db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 
9469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94736db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9493a40ed3dSBarry Smith } else { 9509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 95117ab2063SBarry Smith } 95217ab2063SBarry Smith #else 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 95417ab2063SBarry Smith #endif 95517ab2063SBarry Smith } 9569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95717ab2063SBarry Smith } 95816cd7e1dSShri Abhyankar } 9599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 96017ab2063SBarry Smith } 9619566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 963416022c9SBarry Smith } 964416022c9SBarry Smith 9659804daf3SBarry Smith #include <petscdraw.h> 966ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 967d71ae5a4SJacob Faibussowitsch { 968480ef9eaSBarry Smith Mat A = (Mat)Aa; 969416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 970383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 971383922c3SLisandro Dalcin int color; 972b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 973b0a32e0cSBarry Smith PetscViewer viewer; 974f3ef73ceSBarry Smith PetscViewerFormat format; 975fff043a9SJunchao Zhang const PetscScalar *aa; 976cddf8d76SBarry Smith 9773a40ed3dSBarry Smith PetscFunctionBegin; 
9789566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9799566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9809566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 981383922c3SLisandro Dalcin 982416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 984fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 985d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9860513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 987b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 988416022c9SBarry Smith for (i = 0; i < m; i++) { 9899371c9d4SSatish Balay y_l = m - i - 1.0; 9909371c9d4SSatish Balay y_r = y_l + 1.0; 991bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9929371c9d4SSatish Balay x_l = a->j[j]; 9939371c9d4SSatish Balay x_r = x_l + 1.0; 994fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9959566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 996cddf8d76SBarry Smith } 997cddf8d76SBarry Smith } 998b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 999cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10009371c9d4SSatish Balay y_l = m - i - 1.0; 10019371c9d4SSatish Balay y_r = y_l + 1.0; 1002bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10039371c9d4SSatish Balay x_l = a->j[j]; 10049371c9d4SSatish Balay x_r = x_l + 1.0; 1005fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 10069566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1007cddf8d76SBarry Smith } 1008cddf8d76SBarry Smith } 1009b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1010cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10119371c9d4SSatish Balay y_l = m - i - 1.0; 10129371c9d4SSatish Balay y_r = y_l + 1.0; 1013bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10149371c9d4SSatish Balay x_l = a->j[j]; 10159371c9d4SSatish Balay x_r = x_l + 1.0; 1016fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10179566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1018416022c9SBarry Smith } 1019416022c9SBarry Smith } 1020d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10210513a670SBarry Smith } else { 10220513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10230513a670SBarry Smith /* first determine max of all nonzero values */ 1024b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1025383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1026b0a32e0cSBarry Smith PetscDraw popup; 10270513a670SBarry Smith 10280513a670SBarry Smith for (i = 0; i < nz; i++) { 1029fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10300513a670SBarry Smith } 1031383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10329566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10339566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1034383922c3SLisandro Dalcin 1035d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10360513a670SBarry Smith for (i = 0; i < m; i++) { 1037383922c3SLisandro Dalcin y_l = m - i - 1.0; 1038383922c3SLisandro Dalcin y_r = y_l + 1.0; 1039bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1040383922c3SLisandro Dalcin x_l = a->j[j]; 1041383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1042fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10439566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10440513a670SBarry Smith count++; 10450513a670SBarry Smith } 10460513a670SBarry Smith } 1047d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10480513a670SBarry Smith } 10499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1051480ef9eaSBarry Smith } 1052cddf8d76SBarry Smith 10539804daf3SBarry Smith #include <petscdraw.h> 1054ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1055d71ae5a4SJacob Faibussowitsch { 1056b0a32e0cSBarry Smith PetscDraw draw; 105736db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1058ace3abfcSBarry Smith PetscBool isnull; 1059480ef9eaSBarry Smith 1060480ef9eaSBarry Smith PetscFunctionBegin; 10619566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10629566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10633ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1064480ef9eaSBarry Smith 10659371c9d4SSatish Balay xr = A->cmap->n; 10669371c9d4SSatish Balay yr = A->rmap->n; 10679371c9d4SSatish Balay h = yr / 10.0; 10689371c9d4SSatish Balay w = xr / 10.0; 10699371c9d4SSatish Balay xr += w; 10709371c9d4SSatish Balay yr += h; 10719371c9d4SSatish Balay xl = -w; 10729371c9d4SSatish Balay yl = -h; 10739566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10749566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10759566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10769566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10779566063dSJacob 
Faibussowitsch PetscCall(PetscDrawSave(draw)); 10783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1079416022c9SBarry Smith } 1080416022c9SBarry Smith 1081d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1082d71ae5a4SJacob Faibussowitsch { 1083ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1084416022c9SBarry Smith 10853a40ed3dSBarry Smith PetscFunctionBegin; 10869566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10889566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10891baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10901baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10911baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10929566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109417ab2063SBarry Smith } 109519bcc07fSBarry Smith 1096d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1097d71ae5a4SJacob Faibussowitsch { 1098416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1099580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1100bc43efbbSJunchao Zhang PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n; 110154f21887SBarry Smith MatScalar *aa = a->a, *ap; 11023447b6efSHong Zhang PetscReal ratio = 0.6; 110317ab2063SBarry Smith 11043a40ed3dSBarry Smith PetscFunctionBegin; 11053ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 11069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1107b215bc84SStefano Zampini if 
(A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1108b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11099566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1111b215bc84SStefano Zampini } 111217ab2063SBarry Smith 111343ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 111417ab2063SBarry Smith for (i = 1; i < m; i++) { 1115416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 111617ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111794a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111817ab2063SBarry Smith if (fshift) { 1119bfeeae90SHong Zhang ip = aj + ai[i]; 1120bfeeae90SHong Zhang ap = aa + ai[i]; 112117ab2063SBarry Smith N = ailen[i]; 11229566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 112348a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 112417ab2063SBarry Smith } 112517ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112617ab2063SBarry Smith } 112717ab2063SBarry Smith if (m) { 112817ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112917ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 113017ab2063SBarry Smith } 113117ab2063SBarry Smith /* reset ilen and imax for each row */ 11327b083b7cSBarry Smith a->nonzerorowcnt = 0; 1133396832f4SHong Zhang if (A->structure_only) { 11349566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11359566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1136396832f4SHong Zhang } else { /* !A->structure_only */ 113717ab2063SBarry Smith for (i = 0; i < m; i++) { 113817ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11397b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 114017ab2063SBarry Smith } 1141396832f4SHong Zhang } 
1142bfeeae90SHong Zhang a->nz = ai[m]; 1143aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 1144bc43efbbSJunchao Zhang PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly 1145bc43efbbSJunchao Zhang a->diagonaldense = PETSC_TRUE; 1146bc43efbbSJunchao Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1147bc43efbbSJunchao Zhang for (i = 0; i < n; i++) { 1148bc43efbbSJunchao Zhang if (a->diag[i] >= ai[i + 1]) { 1149bc43efbbSJunchao Zhang a->diagonaldense = PETSC_FALSE; 1150bc43efbbSJunchao Zhang break; 1151bc43efbbSJunchao Zhang } 1152bc43efbbSJunchao Zhang } 11539566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11549566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11559566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11562205254eSKarl Rupp 11578e58a170SBarry Smith A->info.mallocs += a->reallocs; 1158dd5f02e7SSatish Balay a->reallocs = 0; 11596712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 116036db0b34SBarry Smith a->rmax = rmax; 11614e220ebcSLois Curfman McInnes 116248a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11639566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 116517ab2063SBarry Smith } 116617ab2063SBarry Smith 1167ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1168d71ae5a4SJacob Faibussowitsch 
{ 116999cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 117099cafbc1SBarry Smith PetscInt i, nz = a->nz; 11712e5835c6SStefano Zampini MatScalar *aa; 117299cafbc1SBarry Smith 117399cafbc1SBarry Smith PetscFunctionBegin; 11749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117599cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 117999cafbc1SBarry Smith } 118099cafbc1SBarry Smith 1181ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1182d71ae5a4SJacob Faibussowitsch { 118399cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 118499cafbc1SBarry Smith PetscInt i, nz = a->nz; 11852e5835c6SStefano Zampini MatScalar *aa; 118699cafbc1SBarry Smith 118799cafbc1SBarry Smith PetscFunctionBegin; 11889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 118999cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119399cafbc1SBarry Smith } 119499cafbc1SBarry Smith 1195d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1196d71ae5a4SJacob Faibussowitsch { 1197fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1198fff043a9SJunchao Zhang MatScalar *aa; 11993a40ed3dSBarry Smith 12003a40ed3dSBarry Smith PetscFunctionBegin; 12019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 12029566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 12039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 12049566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 12053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120617ab2063SBarry Smith } 1207416022c9SBarry Smith 1208674b392bSAlexander static PetscErrorCode MatReset_SeqAIJ(Mat A) 1209d71ae5a4SJacob Faibussowitsch { 1210416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1211d5d45c9bSBarry Smith 12123a40ed3dSBarry Smith PetscFunctionBegin; 1213b4e2f619SBarry Smith if (A->hash_active) { 1214e3c72094SPierre Jolivet A->ops[0] = a->cops; 1215b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 1216b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 1217b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 1218b4e2f619SBarry Smith } 1219b4e2f619SBarry Smith 12203ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 12219566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12229566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12239566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12289566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12299566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12309566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12319566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12329566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12339566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12349566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 1235674b392bSAlexander 
PetscFunctionReturn(PETSC_SUCCESS); 1236674b392bSAlexander } 1237674b392bSAlexander 1238674b392bSAlexander static PetscErrorCode MatResetHash_SeqAIJ(Mat A) 1239674b392bSAlexander { 1240674b392bSAlexander PetscFunctionBegin; 1241674b392bSAlexander PetscCall(MatReset_SeqAIJ(A)); 1242674b392bSAlexander PetscCall(MatCreate_SeqAIJ_Inode(A)); 1243674b392bSAlexander PetscCall(MatSetUp_Seq_Hash(A)); 1244674b392bSAlexander A->nonzerostate++; 1245674b392bSAlexander PetscFunctionReturn(PETSC_SUCCESS); 1246674b392bSAlexander } 1247674b392bSAlexander 1248674b392bSAlexander PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1249674b392bSAlexander { 1250674b392bSAlexander PetscFunctionBegin; 1251674b392bSAlexander PetscCall(MatReset_SeqAIJ(A)); 12529566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1253901853e0SKris Buschelman 12546718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12556718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12566718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. 
We free it here to avoid 12576718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12586718818eSStefano Zampini due to different matrix sizes */ 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12606718818eSStefano Zampini 12619566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12622e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12632e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12702e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12712e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12722e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12732e956fe4SStefano Zampini #endif 12744222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12769566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12784222ddf1SHong Zhang #endif 1279d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1280d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1281d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1282d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1283d5e393b6SSuyash Tandon #endif 12843d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12863d0639e7SStefano Zampini #endif 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1288af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1290af8000cdSHong Zhang #endif 1291d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1293d24d4204SJose E. 
Roman #endif 129463c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 129763c07aadSStefano Zampini #endif 12989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 13009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 13019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 13022e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 13039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 13049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 1305674b392bSAlexander PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetHash_C", NULL)); 13069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 13079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 13089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 13099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 13109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 13119566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL)); 13129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 13139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 13142e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 13152e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 13162e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 13172e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 13182e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 13192e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 13202e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 13213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 132217ab2063SBarry Smith } 132317ab2063SBarry Smith 1324d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1325d71ae5a4SJacob Faibussowitsch { 1326416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13273a40ed3dSBarry Smith 13283a40ed3dSBarry Smith PetscFunctionBegin; 1329a65d3064SKris Buschelman switch (op) { 1330d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1331d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1332d71ae5a4SJacob Faibussowitsch break; 1333d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1334d71ae5a4SJacob Faibussowitsch 
a->keepnonzeropattern = flg; 1335d71ae5a4SJacob Faibussowitsch break; 1336d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 1337d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1338d71ae5a4SJacob Faibussowitsch break; 1339d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1340d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1341d71ae5a4SJacob Faibussowitsch break; 1342d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1343d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1344d71ae5a4SJacob Faibussowitsch break; 1345d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1346d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1347d71ae5a4SJacob Faibussowitsch break; 1348d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1349d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1350d71ae5a4SJacob Faibussowitsch break; 1351d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1352d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1353d71ae5a4SJacob Faibussowitsch break; 1354d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1355d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1356d71ae5a4SJacob Faibussowitsch break; 1357071fcb05SBarry Smith case MAT_SORTED_FULL: 1358071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1359071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1360071fcb05SBarry Smith break; 1361d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1362d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1363d71ae5a4SJacob Faibussowitsch break; 1364d71ae5a4SJacob Faibussowitsch default: 1365*888c827cSStefano Zampini break; 1366a65d3064SKris Buschelman } 13673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 136817ab2063SBarry Smith } 136917ab2063SBarry Smith 1370ba38deedSJacob Faibussowitsch static PetscErrorCode 
MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1371d71ae5a4SJacob Faibussowitsch { 1372416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1373fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1374c898d852SStefano Zampini PetscScalar *x; 1375c898d852SStefano Zampini const PetscScalar *aa; 137617ab2063SBarry Smith 13773a40ed3dSBarry Smith PetscFunctionBegin; 13789566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 137908401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1381d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1382d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13839566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13842c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13859566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 138835e7444dSHong Zhang } 138935e7444dSHong Zhang 13909566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 139135e7444dSHong Zhang for (i = 0; i < n; i++) { 1392fdc842d1SBarry Smith x[i] = 0.0; 139335e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 139435e7444dSHong Zhang if (aj[j] == i) { 139535e7444dSHong Zhang x[i] = aa[j]; 139617ab2063SBarry Smith break; 139717ab2063SBarry Smith } 139817ab2063SBarry Smith } 139917ab2063SBarry Smith } 14009566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 14019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 140317ab2063SBarry Smith } 140417ab2063SBarry Smith 1405c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1406d71ae5a4SJacob 
Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1407d71ae5a4SJacob Faibussowitsch { 1408416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 14095f22a7b3SSebastian Grimberg const MatScalar *aa; 1410d9ca1df4SBarry Smith PetscScalar *y; 1411d9ca1df4SBarry Smith const PetscScalar *x; 1412d0f46423SBarry Smith PetscInt m = A->rmap->n; 14135c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14145f22a7b3SSebastian Grimberg const MatScalar *v; 1415a77337e4SBarry Smith PetscScalar alpha; 1416d9ca1df4SBarry Smith PetscInt n, i, j; 1417d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14183447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1419ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14205c897100SBarry Smith #endif 142117ab2063SBarry Smith 14223a40ed3dSBarry Smith PetscFunctionBegin; 14239566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14249566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14259566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14275c897100SBarry Smith 14285c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1429fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14305c897100SBarry Smith #else 14313447b6efSHong Zhang if (usecprow) { 14323447b6efSHong Zhang m = cprow.nrows; 14333447b6efSHong Zhang ii = cprow.i; 14347b2bb3b9SHong Zhang ridx = cprow.rindex; 14353447b6efSHong Zhang } else { 14363447b6efSHong Zhang ii = a->i; 14373447b6efSHong Zhang } 143817ab2063SBarry Smith for (i = 0; i < m; i++) { 14393447b6efSHong Zhang idx = a->j + ii[i]; 1440fff043a9SJunchao Zhang v = aa + ii[i]; 14413447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14423447b6efSHong Zhang if (usecprow) { 14437b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14443447b6efSHong Zhang } else { 144517ab2063SBarry Smith alpha = x[i]; 
14463447b6efSHong Zhang } 144704fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 144817ab2063SBarry Smith } 14495c897100SBarry Smith #endif 14509566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14519566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14529566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 145517ab2063SBarry Smith } 145617ab2063SBarry Smith 1457d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1458d71ae5a4SJacob Faibussowitsch { 14595c897100SBarry Smith PetscFunctionBegin; 14609566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14619566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14635c897100SBarry Smith } 14645c897100SBarry Smith 1465c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 146678b84d54SShri Abhyankar 1467d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1468d71ae5a4SJacob Faibussowitsch { 1469416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1470d9fead3dSBarry Smith PetscScalar *y; 147154f21887SBarry Smith const PetscScalar *x; 14725914357eSBarry Smith const MatScalar *a_a; 1473003131ecSBarry Smith PetscInt m = A->rmap->n; 14745914357eSBarry Smith const PetscInt *ii, *ridx = NULL; 1475ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 147617ab2063SBarry Smith 1477b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 147897952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1479fee21e36SBarry Smith #endif 1480fee21e36SBarry Smith 14813a40ed3dSBarry Smith PetscFunctionBegin; 1482b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14839566063dSJacob Faibussowitsch 
PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1485b215bc84SStefano Zampini } 14869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14879566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14889566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1489416022c9SBarry Smith ii = a->i; 14904eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14919566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 149297952fefSHong Zhang m = a->compressedrow.nrows; 149397952fefSHong Zhang ii = a->compressedrow.i; 149497952fefSHong Zhang ridx = a->compressedrow.rindex; 14955914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 14965914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 14975914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 14985914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 14995914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 15005914357eSBarry Smith PetscScalar sum = 0.0; 1501003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1502003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 150397952fefSHong Zhang y[*ridx++] = sum; 150497952fefSHong Zhang } 150597952fefSHong Zhang } else { /* do not use compressed row format */ 1506b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15075914357eSBarry Smith fortranmultaij_(&m, x, ii, a->j, a_a, y); 1508b05257ddSBarry Smith #else 15095914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 15105914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 15115914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 15125914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 15135914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 15145914357eSBarry Smith PetscScalar sum = 0.0; 1515003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 151617ab2063SBarry Smith y[i] = sum; 151717ab2063SBarry Smith } 15188d195f9aSBarry 
Smith #endif 1519b05257ddSBarry Smith } 15209566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15219566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15229566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 152517ab2063SBarry Smith } 152617ab2063SBarry Smith 1527ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1528ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1529d71ae5a4SJacob Faibussowitsch { 1530b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1531b434eb95SMatthew G. Knepley PetscScalar *y; 1532b434eb95SMatthew G. Knepley const PetscScalar *x; 1533fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1534b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1535b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1536b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1537b434eb95SMatthew G. Knepley PetscScalar sum; 1538b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1539b434eb95SMatthew G. Knepley 1540b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1541b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1542b434eb95SMatthew G. Knepley #endif 1543b434eb95SMatthew G. Knepley 1544b434eb95SMatthew G. Knepley PetscFunctionBegin; 15459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15469566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15479566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1548b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1549b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1550b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1551b434eb95SMatthew G. 
Knepley ridx = a->compressedrow.rindex; 1552b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1553b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1554b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1555fff043a9SJunchao Zhang aa = a_a + ii[i]; 1556b434eb95SMatthew G. Knepley sum = 0.0; 1557b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1558b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1559b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1560b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1561b434eb95SMatthew G. Knepley } 1562b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15633d3eaba7SBarry Smith ii = a->i; 1564b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1565b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1566b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1567fff043a9SJunchao Zhang aa = a_a + ii[i]; 1568b434eb95SMatthew G. Knepley sum = 0.0; 1569b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1570b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1571b434eb95SMatthew G. Knepley y[i] = sum; 1572b434eb95SMatthew G. Knepley } 1573b434eb95SMatthew G. Knepley } 15749566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15759566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15769566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1579b434eb95SMatthew G. Knepley } 1580b434eb95SMatthew G. Knepley 1581ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1582ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1583d71ae5a4SJacob Faibussowitsch { 1584b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1585b434eb95SMatthew G. 
Knepley PetscScalar *y, *z; 1586b434eb95SMatthew G. Knepley const PetscScalar *x; 1587fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1588b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1589b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1590b434eb95SMatthew G. Knepley PetscScalar sum; 1591b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1592b434eb95SMatthew G. Knepley 1593b434eb95SMatthew G. Knepley PetscFunctionBegin; 15949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15959566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15969566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1597b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 159848a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1599b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1600b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1601b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1602b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1603b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1604b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1605fff043a9SJunchao Zhang aa = a_a + ii[i]; 1606b434eb95SMatthew G. Knepley sum = y[*ridx]; 1607b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1608b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1609b434eb95SMatthew G. Knepley } 1610b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16113d3eaba7SBarry Smith ii = a->i; 1612b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1613b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1614b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1615fff043a9SJunchao Zhang aa = a_a + ii[i]; 1616b434eb95SMatthew G. Knepley sum = y[i]; 1617b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1618b434eb95SMatthew G. Knepley z[i] = sum; 1619b434eb95SMatthew G. Knepley } 1620b434eb95SMatthew G. 
Knepley } 16219566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16229566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16239566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1626b434eb95SMatthew G. Knepley } 1627b434eb95SMatthew G. Knepley 1628c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1629d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1630d71ae5a4SJacob Faibussowitsch { 1631416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1632f15663dcSBarry Smith PetscScalar *y, *z; 1633f15663dcSBarry Smith const PetscScalar *x; 16345914357eSBarry Smith const MatScalar *a_a; 16355914357eSBarry Smith const PetscInt *ii, *ridx = NULL; 16365914357eSBarry Smith PetscInt m = A->rmap->n; 1637ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16389ea0dfa2SSatish Balay 16393a40ed3dSBarry Smith PetscFunctionBegin; 1640b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16419566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1643b215bc84SStefano Zampini } 16449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16459566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16469566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16474eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 164848a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 164997952fefSHong Zhang m = a->compressedrow.nrows; 165097952fefSHong Zhang ii = a->compressedrow.i; 165197952fefSHong Zhang ridx = a->compressedrow.rindex; 16525914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 16535914357eSBarry Smith 
PetscInt n = ii[i + 1] - ii[i]; 16545914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 16555914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 16565914357eSBarry Smith PetscScalar sum = y[*ridx]; 1657f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165897952fefSHong Zhang z[*ridx++] = sum; 165997952fefSHong Zhang } 166097952fefSHong Zhang } else { /* do not use compressed row format */ 16613d3eaba7SBarry Smith ii = a->i; 1662f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16635914357eSBarry Smith fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z); 1664f15663dcSBarry Smith #else 16655914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 16665914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 16675914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 16685914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 16695914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 16705914357eSBarry Smith PetscScalar sum = y[i]; 1671f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 167217ab2063SBarry Smith z[i] = sum; 167317ab2063SBarry Smith } 167402ab625aSSatish Balay #endif 1675f15663dcSBarry Smith } 16769566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16779566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16789566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 168117ab2063SBarry Smith } 168217ab2063SBarry Smith 168317ab2063SBarry Smith /* 16840b4b7b1cSBarry Smith Adds diagonal pointers to sparse matrix nonzero structure. 
168517ab2063SBarry Smith */ 1686d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1687d71ae5a4SJacob Faibussowitsch { 1688416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1689d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1690c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 169117ab2063SBarry Smith 16923a40ed3dSBarry Smith PetscFunctionBegin; 169309f38230SBarry Smith if (!a->diag) { 16949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1695c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 169609f38230SBarry Smith } 1697d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1698c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1699c0c07093SJunchao Zhang if (alreadySet) { 1700c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1701c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1702c0c07093SJunchao Zhang } 1703c0c07093SJunchao Zhang 170409f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1705bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1706bfeeae90SHong Zhang if (a->j[j] == i) { 170709f38230SBarry Smith a->diag[i] = j; 170817ab2063SBarry Smith break; 170917ab2063SBarry Smith } 171017ab2063SBarry Smith } 171117ab2063SBarry Smith } 17123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 171317ab2063SBarry Smith } 171417ab2063SBarry Smith 1715ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1716d71ae5a4SJacob Faibussowitsch { 171761ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 171861ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 171961ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 172061ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 172161ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 172261ecd0c6SBarry Smith 172361ecd0c6SBarry 
Smith PetscFunctionBegin; 172461ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17269566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 17273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 172861ecd0c6SBarry Smith } 172961ecd0c6SBarry Smith 173061ecd0c6SBarry Smith if (a->diagonaldense) { 173161ecd0c6SBarry Smith cnt = 0; 173261ecd0c6SBarry Smith } else { 17339566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 173461ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1735349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 173661ecd0c6SBarry Smith cnt++; 173761ecd0c6SBarry Smith mdiag[i] = 1; 173861ecd0c6SBarry Smith } 173961ecd0c6SBarry Smith } 174061ecd0c6SBarry Smith } 174161ecd0c6SBarry Smith if (!cnt) { 17429566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 174361ecd0c6SBarry Smith } else { 1744b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1745b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 17469f0612e4SBarry Smith PetscBool free_a = a->free_a, free_ij = a->free_ij; 17476ea2a7edSJunchao Zhang const PetscScalar *Aa; 17486ea2a7edSJunchao Zhang 17496ea2a7edSJunchao Zhang PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host 17506ea2a7edSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa)); 175161ecd0c6SBarry Smith 175261ecd0c6SBarry Smith a->a = NULL; 175361ecd0c6SBarry Smith a->j = NULL; 175461ecd0c6SBarry Smith a->i = NULL; 175561ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1756ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 
0, a->imax)); 175861ecd0c6SBarry Smith 175961ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 176061ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17619566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 176248a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1763447d62f5SStefano Zampini } 17649566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17659566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 17669f0612e4SBarry Smith if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda)); 17679f0612e4SBarry Smith if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj)); 17689f0612e4SBarry Smith if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi)); 176961ecd0c6SBarry Smith } 17709566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 177161ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 17723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 177361ecd0c6SBarry Smith } 177461ecd0c6SBarry Smith 1775be5855fcSBarry Smith /* 1776be5855fcSBarry Smith Checks for missing diagonals 1777be5855fcSBarry Smith */ 1778d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1779d71ae5a4SJacob Faibussowitsch { 1780be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17817734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1782be5855fcSBarry Smith 1783be5855fcSBarry Smith PetscFunctionBegin; 178409f38230SBarry Smith *missing = PETSC_FALSE; 17857734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 178609f38230SBarry Smith *missing = PETSC_TRUE; 178709f38230SBarry Smith if (d) *d = 0; 17889566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 178909f38230SBarry Smith } else { 179001445905SHong Zhang PetscInt n; 179101445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1792f1e2ffcdSBarry Smith diag = a->diag; 179301445905SHong Zhang for (i = 0; i < n; i++) { 17947734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 179509f38230SBarry Smith *missing = PETSC_TRUE; 179609f38230SBarry Smith if (d) *d = i; 17979566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1798358d2f5dSShri Abhyankar break; 179909f38230SBarry Smith } 1800be5855fcSBarry Smith } 1801be5855fcSBarry Smith } 18023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1803be5855fcSBarry Smith } 1804be5855fcSBarry Smith 18050da83c2eSBarry Smith #include <petscblaslapack.h> 18060da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18070da83c2eSBarry Smith 18080da83c2eSBarry Smith /* 18090da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18100da83c2eSBarry Smith */ 1811ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1812d71ae5a4SJacob Faibussowitsch { 18130da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18140da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18150da83c2eSBarry Smith const PetscReal shift = 0.0; 18160da83c2eSBarry Smith PetscInt ipvt[5]; 18174e208921SJed Brown PetscCount flops = 0; 18180da83c2eSBarry Smith PetscScalar work[25], *v_work; 18190da83c2eSBarry Smith 18200da83c2eSBarry Smith PetscFunctionBegin; 18210da83c2eSBarry Smith allowzeropivot = 
PetscNot(A->erroriffailure); 18220da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 182308401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1824ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18259566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 182648a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18270da83c2eSBarry Smith ncnt = 0; 18280da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18290da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18309566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18310da83c2eSBarry Smith switch (bsizes[i]) { 1832d71ae5a4SJacob Faibussowitsch case 1: 1833d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1834d71ae5a4SJacob Faibussowitsch break; 18350da83c2eSBarry Smith case 2: 18369566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18370da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18389566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18390da83c2eSBarry Smith break; 18400da83c2eSBarry Smith case 3: 18419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18420da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18439566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18440da83c2eSBarry Smith break; 18450da83c2eSBarry Smith case 4: 18469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18470da83c2eSBarry Smith if (zeropivotdetected) 
A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18489566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18490da83c2eSBarry Smith break; 18500da83c2eSBarry Smith case 5: 18519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18520da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18539566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18540da83c2eSBarry Smith break; 18550da83c2eSBarry Smith case 6: 18569566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18570da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18589566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18590da83c2eSBarry Smith break; 18600da83c2eSBarry Smith case 7: 18619566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18620da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18639566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18640da83c2eSBarry Smith break; 18650da83c2eSBarry Smith default: 18669566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18670da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18689566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18690da83c2eSBarry Smith } 18700da83c2eSBarry Smith ncnt += bsizes[i]; 18710da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 1872baa50dc0SBrad Aagaard flops += 2 * PetscPowInt64(bsizes[i], 3) / 3; 18730da83c2eSBarry Smith } 18743ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 187548a46eb9SPierre 
Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18769566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18780da83c2eSBarry Smith } 18790da83c2eSBarry Smith 1880422a814eSBarry Smith /* 1881422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1882422a814eSBarry Smith */ 1883ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1884d71ae5a4SJacob Faibussowitsch { 188571f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1886d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18872e5835c6SStefano Zampini const MatScalar *v; 188854f21887SBarry Smith PetscScalar *idiag, *mdiag; 188971f1c65dSBarry Smith 189071f1c65dSBarry Smith PetscFunctionBegin; 18913ba16761SJacob Faibussowitsch if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS); 18929566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 189371f1c65dSBarry Smith diag = a->diag; 18944dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18952e5835c6SStefano Zampini 189671f1c65dSBarry Smith mdiag = a->mdiag; 189771f1c65dSBarry Smith idiag = a->idiag; 18989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1899422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 190071f1c65dSBarry Smith for (i = 0; i < m; i++) { 190171f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1902899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1903899639b0SHong Zhang if (PetscRealPart(fshift)) { 19049566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 19057b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19067b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19077b6c816cSBarry Smith 
A->factorerror_zeropivot_row = i; 190898921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1909899639b0SHong Zhang } 191071f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 191171f1c65dSBarry Smith } 19129566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 191371f1c65dSBarry Smith } else { 191471f1c65dSBarry Smith for (i = 0; i < m; i++) { 191571f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 191671f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 191771f1c65dSBarry Smith } 19189566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 191971f1c65dSBarry Smith } 192071f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 19223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 192371f1c65dSBarry Smith } 192471f1c65dSBarry Smith 1925d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1926d71ae5a4SJacob Faibussowitsch { 1927416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1928e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19292e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 193054f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19313d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 193297f1f81fSBarry Smith const PetscInt *idx, *diag; 193317ab2063SBarry Smith 19343a40ed3dSBarry Smith PetscFunctionBegin; 1935b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19369566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 19373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1938b215bc84SStefano Zampini } 1939b965ef7fSBarry Smith its = its * lits; 194091723122SBarry Smith 194171f1c65dSBarry Smith if (fshift != a->fshift || omega != 
a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19429566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 194371f1c65dSBarry Smith a->fshift = fshift; 194471f1c65dSBarry Smith a->omega = omega; 1945ed480e8bSBarry Smith 194671f1c65dSBarry Smith diag = a->diag; 194771f1c65dSBarry Smith t = a->ssor_work; 1948ed480e8bSBarry Smith idiag = a->idiag; 194971f1c65dSBarry Smith mdiag = a->mdiag; 1950ed480e8bSBarry Smith 19519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19529566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19539566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1954ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 195517ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 195617ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1957ed480e8bSBarry Smith bs = b; 195817ab2063SBarry Smith for (i = 0; i < m; i++) { 195971f1c65dSBarry Smith d = fshift + mdiag[i]; 1960416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1961ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19622e5835c6SStefano Zampini v = aa + diag[i] + 1; 196317ab2063SBarry Smith sum = b[i] * d / omega; 1964003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 196517ab2063SBarry Smith x[i] = sum; 196617ab2063SBarry Smith } 19679566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19689566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19709566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 197217ab2063SBarry Smith } 1973c783ea89SBarry Smith 197408401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1975f7d195e4SLawrence 
Mitchell if (flag & SOR_EISENSTAT) { 19764c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1977887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 197817ab2063SBarry Smith 197917ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 198017ab2063SBarry Smith 1981887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 198217ab2063SBarry Smith */ 198317ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 198417ab2063SBarry Smith 198517ab2063SBarry Smith /* x = (E + U)^{-1} b */ 198617ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1987416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1988ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19892e5835c6SStefano Zampini v = aa + diag[i] + 1; 199017ab2063SBarry Smith sum = b[i]; 1991e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1992ed480e8bSBarry Smith x[i] = sum * idiag[i]; 199317ab2063SBarry Smith } 199417ab2063SBarry Smith 199517ab2063SBarry Smith /* t = b - (2*E - D)x */ 19962e5835c6SStefano Zampini v = aa; 19972205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 199817ab2063SBarry Smith 199917ab2063SBarry Smith /* t = (E + L)^{-1}t */ 2000ed480e8bSBarry Smith ts = t; 2001416022c9SBarry Smith diag = a->diag; 200217ab2063SBarry Smith for (i = 0; i < m; i++) { 2003416022c9SBarry Smith n = diag[i] - a->i[i]; 2004ed480e8bSBarry Smith idx = a->j + a->i[i]; 20052e5835c6SStefano Zampini v = aa + a->i[i]; 200617ab2063SBarry Smith sum = t[i]; 2007003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 2008ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2009733d66baSBarry Smith /* x = x + t */ 2010733d66baSBarry Smith x[i] += t[i]; 201117ab2063SBarry Smith } 201217ab2063SBarry Smith 20139566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20149566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20159566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 
20163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 201717ab2063SBarry Smith } 201817ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 201917ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 202017ab2063SBarry Smith for (i = 0; i < m; i++) { 2021416022c9SBarry Smith n = diag[i] - a->i[i]; 2022ed480e8bSBarry Smith idx = a->j + a->i[i]; 20232e5835c6SStefano Zampini v = aa + a->i[i]; 202417ab2063SBarry Smith sum = b[i]; 2025e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20265c99c7daSBarry Smith t[i] = sum; 2027ed480e8bSBarry Smith x[i] = sum * idiag[i]; 202817ab2063SBarry Smith } 20295c99c7daSBarry Smith xb = t; 20309566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20313a40ed3dSBarry Smith } else xb = b; 203217ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 203317ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2034416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2035ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20362e5835c6SStefano Zampini v = aa + diag[i] + 1; 203717ab2063SBarry Smith sum = xb[i]; 2038e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20395c99c7daSBarry Smith if (xb == b) { 2040ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20415c99c7daSBarry Smith } else { 2042b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 204317ab2063SBarry Smith } 20445c99c7daSBarry Smith } 20459566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 204617ab2063SBarry Smith } 204717ab2063SBarry Smith its--; 204817ab2063SBarry Smith } 204917ab2063SBarry Smith while (its--) { 205017ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 205117ab2063SBarry Smith for (i = 0; i < m; i++) { 2052b19a5dc2SMark Adams /* lower */ 2053b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2054ed480e8bSBarry Smith idx = a->j + a->i[i]; 20552e5835c6SStefano 
Zampini v = aa + a->i[i]; 205617ab2063SBarry Smith sum = b[i]; 2057e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2058b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2059b19a5dc2SMark Adams /* upper */ 2060b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2061b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20622e5835c6SStefano Zampini v = aa + diag[i] + 1; 2063b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2064b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 206517ab2063SBarry Smith } 2066b19a5dc2SMark Adams xb = t; 20679566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2068b19a5dc2SMark Adams } else xb = b; 206917ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 207017ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2071b19a5dc2SMark Adams sum = xb[i]; 2072b19a5dc2SMark Adams if (xb == b) { 2073b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2074416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2075ed480e8bSBarry Smith idx = a->j + a->i[i]; 20762e5835c6SStefano Zampini v = aa + a->i[i]; 2077e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2078ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2079b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2080b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2081b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20822e5835c6SStefano Zampini v = aa + diag[i] + 1; 2083b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2084b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 208517ab2063SBarry Smith } 2086b19a5dc2SMark Adams } 2087b19a5dc2SMark Adams if (xb == b) { 20889566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2089b19a5dc2SMark Adams } else { 20909566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2091b19a5dc2SMark Adams } 209217ab2063SBarry Smith } 209317ab2063SBarry Smith } 20949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20959566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20969566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 209817ab2063SBarry Smith } 209917ab2063SBarry Smith 2100ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2101d71ae5a4SJacob Faibussowitsch { 2102416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21034e220ebcSLois Curfman McInnes 21043a40ed3dSBarry Smith PetscFunctionBegin; 21054e220ebcSLois Curfman McInnes info->block_size = 1.0; 21063966268fSBarry Smith info->nz_allocated = a->maxnz; 21073966268fSBarry Smith info->nz_used = a->nz; 21083966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21093966268fSBarry Smith info->assemblies = A->num_ass; 21103966268fSBarry Smith info->mallocs = A->info.mallocs; 21114dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2112d5f3da31SBarry Smith if (A->factortype) { 21134e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21144e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21154e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21164e220ebcSLois Curfman McInnes } else { 21174e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21184e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21194e220ebcSLois Curfman McInnes info->factor_mallocs = 
0; 21204e220ebcSLois Curfman McInnes } 21213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 212217ab2063SBarry Smith } 212317ab2063SBarry Smith 2124ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2125d71ae5a4SJacob Faibussowitsch { 2126416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2127c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 212897b48c8fSBarry Smith const PetscScalar *xx; 21292e5835c6SStefano Zampini PetscScalar *bb, *aa; 2130c7da8527SEric Chamberland PetscInt d = 0; 213117ab2063SBarry Smith 21323a40ed3dSBarry Smith PetscFunctionBegin; 213397b48c8fSBarry Smith if (x && b) { 21349566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21359566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 213697b48c8fSBarry Smith for (i = 0; i < N; i++) { 2137aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2138447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 213997b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 214097b48c8fSBarry Smith } 21419566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21429566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 214397b48c8fSBarry Smith } 214497b48c8fSBarry Smith 21459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2146a9817697SBarry Smith if (a->keepnonzeropattern) { 2147f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2148aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21499566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2150f1e2ffcdSBarry Smith } 2151f4df32b1SMatthew Knepley if (diag != 0.0) { 2152c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2153c7da8527SEric 
Chamberland d = rows[i]; 2154447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 215508401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2156c7da8527SEric Chamberland } 2157f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2158447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21592e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2160f1e2ffcdSBarry Smith } 2161f1e2ffcdSBarry Smith } 2162f1e2ffcdSBarry Smith } else { 2163f4df32b1SMatthew Knepley if (diag != 0.0) { 216417ab2063SBarry Smith for (i = 0; i < N; i++) { 2165aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21667ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2167447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2168447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2169447d62f5SStefano Zampini } else { 2170416022c9SBarry Smith a->ilen[rows[i]] = 1; 21712e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2172bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2173447d62f5SStefano Zampini } 2174447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21759566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 217617ab2063SBarry Smith } 217717ab2063SBarry Smith } 21783a40ed3dSBarry Smith } else { 217917ab2063SBarry Smith for (i = 0; i < N; i++) { 2180aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2181416022c9SBarry Smith a->ilen[rows[i]] = 0; 218217ab2063SBarry Smith } 218317ab2063SBarry Smith } 2184e56f5c9eSBarry Smith A->nonzerostate++; 2185f1e2ffcdSBarry Smith } 21869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2187dbbe0bcdSBarry Smith 
PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 218917ab2063SBarry Smith } 219017ab2063SBarry Smith 2191ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2192d71ae5a4SJacob Faibussowitsch { 21936e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21946e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21952b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21966e169961SBarry Smith const PetscScalar *xx; 21972e5835c6SStefano Zampini PetscScalar *bb, *aa; 21986e169961SBarry Smith 21996e169961SBarry Smith PetscFunctionBegin; 22003ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 22019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 22026e169961SBarry Smith if (x && b) { 22039566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 22049566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 22052b40b63fSBarry Smith vecs = PETSC_TRUE; 22066e169961SBarry Smith } 22079566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 22086e169961SBarry Smith for (i = 0; i < N; i++) { 2209aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 22108e3a54c0SPierre Jolivet PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]])); 22112205254eSKarl Rupp 22126e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22136e169961SBarry Smith } 22146e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22156e169961SBarry Smith if (!zeroed[i]) { 22166e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22174cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22182e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22192e5835c6SStefano Zampini 
aa[j] = 0.0; 22206e169961SBarry Smith } 22216e169961SBarry Smith } 22224cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i]; 22236e169961SBarry Smith } 22246e169961SBarry Smith if (x && b) { 22259566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22269566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22276e169961SBarry Smith } 22289566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22296e169961SBarry Smith if (diag != 0.0) { 22309566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22311d5a398dSstefano_zampini if (missing) { 22321d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22334cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2234aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22359566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22361d5a398dSstefano_zampini } 22371d5a398dSstefano_zampini } else { 2238ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22396e169961SBarry Smith } 22401d5a398dSstefano_zampini } 22419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2242dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22446e169961SBarry Smith } 22456e169961SBarry Smith 2246d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2247d71ae5a4SJacob Faibussowitsch { 2248fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2249fff043a9SJunchao Zhang const PetscScalar *aa; 225017ab2063SBarry Smith 22513a40ed3dSBarry Smith PetscFunctionBegin; 22529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
2253416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22548e3a54c0SPierre Jolivet if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]); 225517ab2063SBarry Smith if (idx) { 22565c0db29aSPierre Jolivet if (*nz && a->j) *idx = a->j + a->i[row]; 2257f4259b30SLisandro Dalcin else *idx = NULL; 225817ab2063SBarry Smith } 22599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 226117ab2063SBarry Smith } 226217ab2063SBarry Smith 2263d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2264d71ae5a4SJacob Faibussowitsch { 22653a40ed3dSBarry Smith PetscFunctionBegin; 22663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 226717ab2063SBarry Smith } 226817ab2063SBarry Smith 2269ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2270d71ae5a4SJacob Faibussowitsch { 2271416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22722e5835c6SStefano Zampini const MatScalar *v; 227336db0b34SBarry Smith PetscReal sum = 0.0; 227497f1f81fSBarry Smith PetscInt i, j; 227517ab2063SBarry Smith 22763a40ed3dSBarry Smith PetscFunctionBegin; 22779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 227817ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2279570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2280570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2281792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2282570b7f6dSBarry Smith #else 2283416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22849371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22859371c9d4SSatish Balay v++; 228617ab2063SBarry Smith } 22878f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2288570b7f6dSBarry Smith #endif 22899566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22903a40ed3dSBarry Smith } else if (type == NORM_1) { 229136db0b34SBarry Smith PetscReal *tmp; 229297f1f81fSBarry Smith PetscInt *jj = a->j; 22939566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2294064f8208SBarry Smith *nrm = 0.0; 2295416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22969371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22979371c9d4SSatish Balay v++; 229817ab2063SBarry Smith } 2299d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2300064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 230117ab2063SBarry Smith } 23029566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23039566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 23043a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2305064f8208SBarry Smith *nrm = 0.0; 2306d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 23078e3a54c0SPierre Jolivet const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]); 230817ab2063SBarry Smith sum = 0.0; 2309416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23109371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23119371c9d4SSatish Balay v2++; 231217ab2063SBarry Smith } 2313064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 231417ab2063SBarry Smith } 23159566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2316f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 231917ab2063SBarry Smith } 232017ab2063SBarry Smith 2321ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2322d71ae5a4SJacob Faibussowitsch { 23233d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 232454f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 
23252e5835c6SStefano Zampini const MatScalar *va, *vb; 232697f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2327cd0d46ebSvictorle 2328cd0d46ebSvictorle PetscFunctionBegin; 23299566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23309566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23315485867bSBarry Smith if (ma != nb || na != mb) { 23325485867bSBarry Smith *f = PETSC_FALSE; 23333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23345485867bSBarry Smith } 23359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23379371c9d4SSatish Balay aii = aij->i; 23389371c9d4SSatish Balay bii = bij->i; 23399371c9d4SSatish Balay adx = aij->j; 23409371c9d4SSatish Balay bdx = bij->j; 23419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2343cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2344cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2345cd0d46ebSvictorle 2346cd0d46ebSvictorle *f = PETSC_TRUE; 2347cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2348cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 234997f1f81fSBarry Smith PetscInt idc, idr; 23505485867bSBarry Smith PetscScalar vc, vr; 2351cd0d46ebSvictorle /* column/row index/value */ 23525485867bSBarry Smith idc = adx[aptr[i]]; 23535485867bSBarry Smith idr = bdx[bptr[idc]]; 23545485867bSBarry Smith vc = va[aptr[i]]; 23555485867bSBarry Smith vr = vb[bptr[idc]]; 23565485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23575485867bSBarry Smith *f = PETSC_FALSE; 23585485867bSBarry Smith goto done; 2359cd0d46ebSvictorle } else { 23605485867bSBarry Smith aptr[i]++; 23615485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2362cd0d46ebSvictorle } 2363cd0d46ebSvictorle } 2364cd0d46ebSvictorle } 2365cd0d46ebSvictorle done: 23669566063dSJacob Faibussowitsch 
PetscCall(PetscFree(aptr)); 23679566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 23703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2371cd0d46ebSvictorle } 2372cd0d46ebSvictorle 2373ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2374d71ae5a4SJacob Faibussowitsch { 23753d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 237654f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 237754f21887SBarry Smith MatScalar *va, *vb; 23781cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23791cbb95d3SBarry Smith 23801cbb95d3SBarry Smith PetscFunctionBegin; 23819566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23829566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23831cbb95d3SBarry Smith if (ma != nb || na != mb) { 23841cbb95d3SBarry Smith *f = PETSC_FALSE; 23853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23861cbb95d3SBarry Smith } 23879371c9d4SSatish Balay aii = aij->i; 23889371c9d4SSatish Balay bii = bij->i; 23899371c9d4SSatish Balay adx = aij->j; 23909371c9d4SSatish Balay bdx = bij->j; 23919371c9d4SSatish Balay va = aij->a; 23929371c9d4SSatish Balay vb = bij->a; 23939566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23951cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23961cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23971cbb95d3SBarry Smith 23981cbb95d3SBarry Smith *f = PETSC_TRUE; 23991cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 24001cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 24011cbb95d3SBarry Smith PetscInt idc, idr; 24021cbb95d3SBarry Smith PetscScalar vc, vr; 24031cbb95d3SBarry 
Smith /* column/row index/value */ 24041cbb95d3SBarry Smith idc = adx[aptr[i]]; 24051cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24061cbb95d3SBarry Smith vc = va[aptr[i]]; 24071cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24081cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24091cbb95d3SBarry Smith *f = PETSC_FALSE; 24101cbb95d3SBarry Smith goto done; 24111cbb95d3SBarry Smith } else { 24121cbb95d3SBarry Smith aptr[i]++; 24131cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24141cbb95d3SBarry Smith } 24151cbb95d3SBarry Smith } 24161cbb95d3SBarry Smith } 24171cbb95d3SBarry Smith done: 24189566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24199566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24211cbb95d3SBarry Smith } 24221cbb95d3SBarry Smith 2423d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2424d71ae5a4SJacob Faibussowitsch { 2425416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2426fff8e43fSBarry Smith const PetscScalar *l, *r; 2427fff8e43fSBarry Smith PetscScalar x; 242854f21887SBarry Smith MatScalar *v; 2429fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2430fff8e43fSBarry Smith const PetscInt *jj; 243117ab2063SBarry Smith 24323a40ed3dSBarry Smith PetscFunctionBegin; 243317ab2063SBarry Smith if (ll) { 24343ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24353ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24369566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 243708401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24389566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 244017ab2063SBarry Smith for (i = 0; i < m; i++) { 244117ab2063SBarry Smith x = 
l[i]; 2442416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24432205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 244417ab2063SBarry Smith } 24459566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24469566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 244817ab2063SBarry Smith } 244917ab2063SBarry Smith if (rr) { 24509566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 245108401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24529566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24542e5835c6SStefano Zampini jj = a->j; 24552205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24579566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24589566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 245917ab2063SBarry Smith } 24609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 246217ab2063SBarry Smith } 246317ab2063SBarry Smith 2464d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2465d71ae5a4SJacob Faibussowitsch { 2466db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2467d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 246897f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24695d0c19d7SBarry Smith const PetscInt *irow, *icol; 24702e5835c6SStefano Zampini const PetscScalar *aa; 24715d0c19d7SBarry Smith PetscInt nrows, ncols; 247297f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = 
a->ilen; 2473fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2474416022c9SBarry Smith Mat C; 2475cdc6f3adSToby Isaac PetscBool stride; 247617ab2063SBarry Smith 24773a40ed3dSBarry Smith PetscFunctionBegin; 24789566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24799566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24809566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 248117ab2063SBarry Smith 24829566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2483ff718158SBarry Smith if (stride) { 24849566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2485ff718158SBarry Smith } else { 2486ff718158SBarry Smith first = 0; 2487ff718158SBarry Smith step = 0; 2488ff718158SBarry Smith } 2489fee21e36SBarry Smith if (stride && step == 1) { 249002834360SBarry Smith /* special case of contiguous rows */ 24919566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 249202834360SBarry Smith /* loop over new rows determining lens and starting points */ 249302834360SBarry Smith for (i = 0; i < nrows; i++) { 2494bfeeae90SHong Zhang kstart = ai[irow[i]]; 2495a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2496a91a9bebSLisandro Dalcin starts[i] = kstart; 249702834360SBarry Smith for (k = kstart; k < kend; k++) { 2498bfeeae90SHong Zhang if (aj[k] >= first) { 249902834360SBarry Smith starts[i] = k; 250002834360SBarry Smith break; 250102834360SBarry Smith } 250202834360SBarry Smith } 2503a2744918SBarry Smith sum = 0; 250402834360SBarry Smith while (k < kend) { 2505bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2506a2744918SBarry Smith sum++; 250702834360SBarry Smith } 2508a2744918SBarry Smith lens[i] = sum; 250902834360SBarry Smith } 251002834360SBarry Smith /* create submatrix */ 2511cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 251297f1f81fSBarry Smith PetscInt n_cols, n_rows; 25139566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2514aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25159566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 251608480c60SBarry Smith C = *B; 25173a40ed3dSBarry Smith } else { 25183bef6203SJed Brown PetscInt rbs, cbs; 25199566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25209566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25219566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25229566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25239566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25249566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 252608480c60SBarry Smith } 2527db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2528db02288aSLois Curfman McInnes 252902834360SBarry Smith /* loop over rows inserting into submatrix */ 2530fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2531db02288aSLois Curfman McInnes j_new = c->j; 2532db02288aSLois Curfman McInnes i_new = c->i; 25339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 253402834360SBarry Smith for (i = 0; i < nrows; i++) { 2535a2744918SBarry Smith ii = starts[i]; 2536a2744918SBarry Smith lensi = lens[i]; 2537810441c8SPierre Jolivet if (lensi) { 2538ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25399566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2540a2744918SBarry Smith a_new += lensi; 2541810441c8SPierre Jolivet } 2542a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2543a2744918SBarry 
Smith c->ilen[i] = lensi; 254402834360SBarry Smith } 2545fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25479566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25483a40ed3dSBarry Smith } else { 25499566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25524dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25536bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25544dcab191SBarry Smith smap[icol[i]] = i + 1; 25554dcab191SBarry Smith } 25564dcab191SBarry Smith 255702834360SBarry Smith /* determine lens of each row */ 255802834360SBarry Smith for (i = 0; i < nrows; i++) { 2559bfeeae90SHong Zhang kstart = ai[irow[i]]; 256002834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 256102834360SBarry Smith lens[i] = 0; 256202834360SBarry Smith for (k = kstart; k < kend; k++) { 2563ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 256402834360SBarry Smith } 256502834360SBarry Smith } 256617ab2063SBarry Smith /* Create and fill new matrix */ 2567a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2568ace3abfcSBarry Smith PetscBool equal; 25690f5bd95cSBarry Smith 257099141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2571aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25729566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 2573fdfbdca6SPierre Jolivet PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. 
wrong number of nonzeros"); 25749566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 257508480c60SBarry Smith C = *B; 25763a40ed3dSBarry Smith } else { 25773bef6203SJed Brown PetscInt rbs, cbs; 25789566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25799566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25809566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25819566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 258237a5e0faSPierre Jolivet if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25839566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 258508480c60SBarry Smith } 25869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2587fb3c7e2dSJunchao Zhang 2588f4f49eeaSPierre Jolivet c = (Mat_SeqAIJ *)C->data; 2589fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 259017ab2063SBarry Smith for (i = 0; i < nrows; i++) { 259199141d43SSatish Balay row = irow[i]; 2592bfeeae90SHong Zhang kstart = ai[row]; 259399141d43SSatish Balay kend = kstart + a->ilen[row]; 2594bfeeae90SHong Zhang mat_i = c->i[i]; 25958e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 25968e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 259799141d43SSatish Balay mat_ilen = c->ilen + i; 259817ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2599bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2600ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26012e5835c6SStefano Zampini *mat_a++ = aa[k]; 260299141d43SSatish Balay (*mat_ilen)++; 260317ab2063SBarry Smith } 260417ab2063SBarry Smith } 260517ab2063SBarry Smith } 26069566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 260702834360SBarry Smith /* Free work space */ 26089566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26099566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26109566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2611cdc6f3adSToby Isaac /* sort */ 2612cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2613cdc6f3adSToby Isaac PetscInt ilen; 2614cdc6f3adSToby Isaac 2615cdc6f3adSToby Isaac mat_i = c->i[i]; 26168e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 26178e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 2618cdc6f3adSToby Isaac ilen = c->ilen[i]; 26199566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2620cdc6f3adSToby Isaac } 2621fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 262202834360SBarry Smith } 26238c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26249566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2625305c6ccfSStefano Zampini #endif 26269566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26279566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 262817ab2063SBarry Smith 26299566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2630416022c9SBarry Smith *B = C; 26313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 263217ab2063SBarry Smith } 263317ab2063SBarry Smith 2634ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2635d71ae5a4SJacob Faibussowitsch { 263682d44351SHong Zhang Mat B; 263782d44351SHong Zhang 263882d44351SHong Zhang PetscFunctionBegin; 2639c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26409566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26419566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, 
mat->rmap->n, mat->cmap->n)); 26429566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26439566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26449566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 264582d44351SHong Zhang *subMat = B; 2646c2d650bdSHong Zhang } else { 26479566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2648c2d650bdSHong Zhang } 26493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 265082d44351SHong Zhang } 265182d44351SHong Zhang 2652ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2653d71ae5a4SJacob Faibussowitsch { 265463b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 265563b91edcSBarry Smith Mat outA; 2656ace3abfcSBarry Smith PetscBool row_identity, col_identity; 265763b91edcSBarry Smith 26583a40ed3dSBarry Smith PetscFunctionBegin; 265908401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26601df811f5SHong Zhang 26619566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26629566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2663a871dcd8SBarry Smith 266463b91edcSBarry Smith outA = inA; 2665d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26669566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26679566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26682205254eSKarl Rupp 26699566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26709566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26712205254eSKarl Rupp 2672c3122656SLisandro Dalcin a->row = row; 26732205254eSKarl Rupp 26749566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26759566063dSJacob Faibussowitsch 
PetscCall(ISDestroy(&a->col)); 26762205254eSKarl Rupp 2677c3122656SLisandro Dalcin a->col = col; 267863b91edcSBarry Smith 267936db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26809566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26819566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2682f0ec6fceSSatish Balay 268394a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 268594a9d846SBarry Smith } 268663b91edcSBarry Smith 26879566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2688137fb511SHong Zhang if (row_identity && col_identity) { 26899566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2690137fb511SHong Zhang } else { 26919566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2692137fb511SHong Zhang } 26933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2694a871dcd8SBarry Smith } 2695a871dcd8SBarry Smith 2696d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2697d71ae5a4SJacob Faibussowitsch { 2698f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2699dfa0f9e5SStefano Zampini PetscScalar *v; 2700c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 27013a40ed3dSBarry Smith 27023a40ed3dSBarry Smith PetscFunctionBegin; 27039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27049566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2705792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27069566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 
27093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2710f0b747eeSBarry Smith } 2711f0b747eeSBarry Smith 2712d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2713d71ae5a4SJacob Faibussowitsch { 271416b64355SHong Zhang PetscInt i; 271516b64355SHong Zhang 271616b64355SHong Zhang PetscFunctionBegin; 271716b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27189566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 271916b64355SHong Zhang 272048a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27219566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 272216b64355SHong Zhang 272316b64355SHong Zhang if (submatj->rbuf1) { 27249566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27259566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 272616b64355SHong Zhang } 272716b64355SHong Zhang 272848a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27299566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27309566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 273116b64355SHong Zhang } 273216b64355SHong Zhang 273316b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2734eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27359566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27369566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 273716b64355SHong Zhang #else 27389566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 273916b64355SHong Zhang #endif 274016b64355SHong Zhang 274116b64355SHong Zhang if (!submatj->allcolumns) { 274216b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 
2743835f2295SStefano Zampini PetscCall(PetscHMapIDestroy(&submatj->cmap)); 274416b64355SHong Zhang #else 27459566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 274616b64355SHong Zhang #endif 274716b64355SHong Zhang } 27489566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 274916b64355SHong Zhang 27509566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 27513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 275216b64355SHong Zhang } 275316b64355SHong Zhang 2754d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2755d71ae5a4SJacob Faibussowitsch { 275616b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27575c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 275816b64355SHong Zhang 275916b64355SHong Zhang PetscFunctionBegin; 27609566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27619566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 276316b64355SHong Zhang } 276416b64355SHong Zhang 276589a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2766ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2767d71ae5a4SJacob Faibussowitsch { 27682d033e1fSHong Zhang PetscInt i; 27690fb991dcSHong Zhang Mat C; 27700fb991dcSHong Zhang Mat_SeqAIJ *c; 27710fb991dcSHong Zhang Mat_SubSppt *submatj; 27722d033e1fSHong Zhang 27732d033e1fSHong Zhang PetscFunctionBegin; 27742d033e1fSHong Zhang for (i = 0; i < n; i++) { 27750fb991dcSHong Zhang C = (*mat)[i]; 27760fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27770fb991dcSHong Zhang submatj = c->submatis1; 27782d033e1fSHong Zhang if (submatj) { 2779682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 278026cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27819566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 
27829566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27839566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27843faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27859566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27869566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27879566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2788682e4c99SStefano Zampini } 27892d033e1fSHong Zhang } else { 27909566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27912d033e1fSHong Zhang } 27922d033e1fSHong Zhang } 279386e85357SHong Zhang 279463a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27959566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 279663a75b2aSHong Zhang 27979566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 27983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 27992d033e1fSHong Zhang } 28002d033e1fSHong Zhang 2801ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2802d71ae5a4SJacob Faibussowitsch { 280397f1f81fSBarry Smith PetscInt i; 2804cddf8d76SBarry Smith 28053a40ed3dSBarry Smith PetscFunctionBegin; 280648a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2807cddf8d76SBarry Smith 280848a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2810cddf8d76SBarry Smith } 2811cddf8d76SBarry Smith 2812ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2813d71ae5a4SJacob Faibussowitsch { 2814e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28159a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, 
isz, val; 28165d0c19d7SBarry Smith const PetscInt *idx; 28179a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1; 2818f1af5d2fSBarry Smith PetscBT table; 2819bbd702dbSSatish Balay 28203a40ed3dSBarry Smith PetscFunctionBegin; 28219a88ca10SBarry Smith m = A->rmap->n / bs; 2822e4d965acSSatish Balay ai = a->i; 2823bfeeae90SHong Zhang aj = a->j; 28248a047759SSatish Balay 282508401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 282606763907SSatish Balay 28279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28289566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 282906763907SSatish Balay 2830e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2831b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2832e4d965acSSatish Balay isz = 0; 28339566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2834e4d965acSSatish Balay 2835e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28369566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28379566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2838e4d965acSSatish Balay 28399a88ca10SBarry Smith if (bs > 1) { 28409a88ca10SBarry Smith /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 28419a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28429a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28439a88ca10SBarry Smith } 28449a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28459a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28469a88ca10SBarry Smith 28479a88ca10SBarry Smith k = 0; 28489a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28499a88ca10SBarry Smith n = isz; 28509a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28519a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28529a88ca10SBarry Smith row = bs * nidx[k] + ll; 28539a88ca10SBarry Smith start = ai[row]; 28549a88ca10SBarry Smith end = ai[row + 1]; 28559a88ca10SBarry Smith for (l = start; l < end; l++) { 28569a88ca10SBarry Smith val = aj[l] / bs; 28579a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28589a88ca10SBarry Smith } 28599a88ca10SBarry Smith } 28609a88ca10SBarry Smith } 28619a88ca10SBarry Smith } 286257508eceSPierre Jolivet PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, is + i)); 28639a88ca10SBarry Smith } else { 2864dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2865e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28662205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28674dcbc457SBarry Smith } 28689566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28699566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2870e4d965acSSatish Balay 287104a348a9SBarry Smith k = 0; 287204a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 287304a348a9SBarry Smith n = isz; 287406763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2875e4d965acSSatish Balay row = nidx[k]; 2876e4d965acSSatish Balay start = ai[row]; 2877e4d965acSSatish Balay end = ai[row + 1]; 287804a348a9SBarry Smith for (l = start; l < end; l++) { 2879efb16452SHong Zhang val = aj[l]; 28802205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2881e4d965acSSatish Balay } 2882e4d965acSSatish Balay } 2883e4d965acSSatish Balay } 288457508eceSPierre Jolivet PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, is + i)); 2885e4d965acSSatish Balay } 28869a88ca10SBarry Smith } 28879566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28889566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28904dcbc457SBarry Smith } 289117ab2063SBarry Smith 2892ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2893d71ae5a4SJacob Faibussowitsch { 28940513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28953b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 28965d0c19d7SBarry Smith const PetscInt *row, *col; 28975d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 289856cd22aeSBarry Smith IS icolp, irowp; 28990298fd71SBarry Smith PetscInt *cwork = NULL; 29000298fd71SBarry Smith PetscScalar *vwork = NULL; 29010513a670SBarry Smith 
29023a40ed3dSBarry Smith PetscFunctionBegin; 29039566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29049566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29059566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29069566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29070513a670SBarry Smith 29080513a670SBarry Smith /* determine lengths of permuted rows */ 29099566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29102205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29119566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29129566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29139566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29149566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29169566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29170513a670SBarry Smith 29189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29190513a670SBarry Smith for (i = 0; i < m; i++) { 29209566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29212205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29229566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29239566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29240513a670SBarry Smith } 29259566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29262205254eSKarl Rupp 29273c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29282205254eSKarl Rupp 29298c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29309566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29319fe5e383SStefano Zampini #endif 
29329566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29339566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29349566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29359566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29369566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29379566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 293848a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29400513a670SBarry Smith } 29410513a670SBarry Smith 2942d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2943d71ae5a4SJacob Faibussowitsch { 2944cb5b572fSBarry Smith PetscFunctionBegin; 294533f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 294633f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2947be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2948be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29492e5835c6SStefano Zampini const PetscScalar *aa; 2950be6bf707SBarry Smith 29519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 295208401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29539566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29549566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2956cb5b572fSBarry Smith } else { 29579566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2958cb5b572fSBarry Smith } 29593ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 2960cb5b572fSBarry Smith } 2961cb5b572fSBarry Smith 2962d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2963d71ae5a4SJacob Faibussowitsch { 29646c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29656e111a19SKarl Rupp 29666c0721eeSBarry Smith PetscFunctionBegin; 29676c0721eeSBarry Smith *array = a->a; 29683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29696c0721eeSBarry Smith } 29706c0721eeSBarry Smith 2971d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[]) 2972d71ae5a4SJacob Faibussowitsch { 29736c0721eeSBarry Smith PetscFunctionBegin; 2974f38c1e66SStefano Zampini *array = NULL; 29753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29766c0721eeSBarry Smith } 2977273d9f13SBarry Smith 29788229c054SShri Abhyankar /* 29798229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29808229c054SShri Abhyankar have different nonzero structure. 
29818229c054SShri Abhyankar */ 2982d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2983d71ae5a4SJacob Faibussowitsch { 2984b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2985ec7775f6SShri Abhyankar 2986ec7775f6SShri Abhyankar PetscFunctionBegin; 2987ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2988ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 29898e3a54c0SPierre Jolivet const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]); 2990b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 2991b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 29928af7cee1SJed Brown nnz[i] = 0; 29938af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 2994b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2995b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 29968af7cee1SJed Brown nnz[i]++; 29978af7cee1SJed Brown } 29988af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 2999ec7775f6SShri Abhyankar } 30003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3001ec7775f6SShri Abhyankar } 3002ec7775f6SShri Abhyankar 3003d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3004d71ae5a4SJacob Faibussowitsch { 3005b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3006b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3007b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data; 3008b264fe52SHong Zhang 3009b264fe52SHong Zhang PetscFunctionBegin; 3010b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30119566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 30123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3013b264fe52SHong Zhang } 
3014b264fe52SHong Zhang 3015d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3016d71ae5a4SJacob Faibussowitsch { 3017ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3018ac90fabeSBarry Smith 3019ac90fabeSBarry Smith PetscFunctionBegin; 3020134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3021134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3022134adf20SPierre Jolivet if (e) { 30239566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 302481fa06acSBarry Smith if (e) { 30259566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3026134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 302781fa06acSBarry Smith } 302881fa06acSBarry Smith } 302954c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 303081fa06acSBarry Smith } 3031ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30322e5835c6SStefano Zampini const PetscScalar *xa; 30332e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 303481fa06acSBarry Smith PetscBLASInt one = 1, bnz; 303581fa06acSBarry Smith 30369566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3039792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 30409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30429566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30449566063dSJacob 
Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3045ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30469566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3047ac90fabeSBarry Smith } else { 30488229c054SShri Abhyankar Mat B; 30498229c054SShri Abhyankar PetscInt *nnz; 30509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30519566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30529566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30539566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30549566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30559566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30579566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30589566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30599bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30609566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3061ac90fabeSBarry Smith } 30623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3063ac90fabeSBarry Smith } 3064ac90fabeSBarry Smith 3065d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3066d71ae5a4SJacob Faibussowitsch { 3067354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3068354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3069354c94deSBarry Smith PetscInt i, nz; 3070354c94deSBarry Smith PetscScalar *a; 3071354c94deSBarry Smith 3072354c94deSBarry Smith PetscFunctionBegin; 3073354c94deSBarry Smith nz = aij->nz; 30749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30752205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 
30769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3077354c94deSBarry Smith #else 3078354c94deSBarry Smith PetscFunctionBegin; 3079354c94deSBarry Smith #endif 30803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3081354c94deSBarry Smith } 3082354c94deSBarry Smith 3083ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3084d71ae5a4SJacob Faibussowitsch { 3085e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3086d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3087e34fafa9SBarry Smith PetscReal atmp; 3088985db425SBarry Smith PetscScalar *x; 3089ce496241SStefano Zampini const MatScalar *aa, *av; 3090e34fafa9SBarry Smith 3091e34fafa9SBarry Smith PetscFunctionBegin; 309228b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 30939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3094ce496241SStefano Zampini aa = av; 3095e34fafa9SBarry Smith ai = a->i; 3096e34fafa9SBarry Smith aj = a->j; 3097e34fafa9SBarry Smith 30989566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 30999566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 310008401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3101e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31029371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31039371c9d4SSatish Balay ai++; 310462e5df07SMark Adams x[i] = 0; 3105e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3106985db425SBarry Smith atmp = PetscAbsScalar(*aa); 31079371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31089371c9d4SSatish Balay x[i] = atmp; 31099371c9d4SSatish Balay if (idx) idx[i] = *aj; 31109371c9d4SSatish Balay } 31119371c9d4SSatish Balay aa++; 31129371c9d4SSatish Balay aj++; 3113985db425SBarry Smith } 3114985db425SBarry Smith } 31159566063dSJacob 
Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3118985db425SBarry Smith } 3119985db425SBarry Smith 3120eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v) 3121eede4a3fSMark Adams { 3122eede4a3fSMark Adams Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3123eede4a3fSMark Adams PetscInt i, j, m = A->rmap->n, *ai, ncols, n; 3124eede4a3fSMark Adams PetscScalar *x; 3125eede4a3fSMark Adams const MatScalar *aa, *av; 3126eede4a3fSMark Adams 3127eede4a3fSMark Adams PetscFunctionBegin; 3128eede4a3fSMark Adams PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3129eede4a3fSMark Adams PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3130eede4a3fSMark Adams aa = av; 3131eede4a3fSMark Adams ai = a->i; 3132eede4a3fSMark Adams 3133eede4a3fSMark Adams PetscCall(VecGetArrayWrite(v, &x)); 3134eede4a3fSMark Adams PetscCall(VecGetLocalSize(v, &n)); 3135eede4a3fSMark Adams PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3136eede4a3fSMark Adams for (i = 0; i < m; i++) { 3137eede4a3fSMark Adams ncols = ai[1] - ai[0]; 3138eede4a3fSMark Adams ai++; 313962e5df07SMark Adams x[i] = 0; 3140eede4a3fSMark Adams for (j = 0; j < ncols; j++) { 3141eede4a3fSMark Adams x[i] += PetscAbsScalar(*aa); 3142eede4a3fSMark Adams aa++; 3143eede4a3fSMark Adams } 3144eede4a3fSMark Adams } 3145eede4a3fSMark Adams PetscCall(VecRestoreArrayWrite(v, &x)); 3146eede4a3fSMark Adams PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3147eede4a3fSMark Adams PetscFunctionReturn(PETSC_SUCCESS); 3148eede4a3fSMark Adams } 3149eede4a3fSMark Adams 3150ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3151d71ae5a4SJacob Faibussowitsch { 3152985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3153d0f46423SBarry 
Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3154985db425SBarry Smith PetscScalar *x; 3155ce496241SStefano Zampini const MatScalar *aa, *av; 3156985db425SBarry Smith 3157985db425SBarry Smith PetscFunctionBegin; 315828b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3160ce496241SStefano Zampini aa = av; 3161985db425SBarry Smith ai = a->i; 3162985db425SBarry Smith aj = a->j; 3163985db425SBarry Smith 31649566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31659566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 316608401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3167985db425SBarry Smith for (i = 0; i < m; i++) { 31689371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31699371c9d4SSatish Balay ai++; 3170d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31719371c9d4SSatish Balay x[i] = *aa; 31729371c9d4SSatish Balay if (idx) idx[i] = 0; 3173985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3174985db425SBarry Smith x[i] = 0.0; 3175985db425SBarry Smith if (idx) { 3176985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3177985db425SBarry Smith if (aj[j] > j) { 3178985db425SBarry Smith idx[i] = j; 3179985db425SBarry Smith break; 3180985db425SBarry Smith } 3181985db425SBarry Smith } 31821a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31831a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3184985db425SBarry Smith } 3185985db425SBarry Smith } 3186985db425SBarry Smith for (j = 0; j < ncols; j++) { 31879371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31889371c9d4SSatish Balay x[i] = *aa; 31899371c9d4SSatish Balay if (idx) idx[i] = *aj; 
31909371c9d4SSatish Balay } 31919371c9d4SSatish Balay aa++; 31929371c9d4SSatish Balay aj++; 3193985db425SBarry Smith } 3194985db425SBarry Smith } 31959566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3198985db425SBarry Smith } 3199985db425SBarry Smith 3200ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3201d71ae5a4SJacob Faibussowitsch { 3202c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3203c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3204ce496241SStefano Zampini PetscScalar *x; 3205ce496241SStefano Zampini const MatScalar *aa, *av; 3206c87e5d42SMatthew Knepley 3207c87e5d42SMatthew Knepley PetscFunctionBegin; 32089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3209ce496241SStefano Zampini aa = av; 3210c87e5d42SMatthew Knepley ai = a->i; 3211c87e5d42SMatthew Knepley aj = a->j; 3212c87e5d42SMatthew Knepley 32139566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32149566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 321508401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. 
%" PetscInt_FMT " rows", m, n); 3216c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32179371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32189371c9d4SSatish Balay ai++; 3219f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32209371c9d4SSatish Balay x[i] = *aa; 32219371c9d4SSatish Balay if (idx) idx[i] = 0; 3222f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3223f07e67edSHong Zhang x[i] = 0.0; 3224f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3225289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3226f07e67edSHong Zhang if (aj[j] > j) { 3227f07e67edSHong Zhang idx[i] = j; 32282205254eSKarl Rupp break; 32292205254eSKarl Rupp } 3230289a08f5SMatthew Knepley } 3231f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3232f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3233f07e67edSHong Zhang } 3234289a08f5SMatthew Knepley } 3235c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32369371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32379371c9d4SSatish Balay x[i] = *aa; 32389371c9d4SSatish Balay if (idx) idx[i] = *aj; 32399371c9d4SSatish Balay } 32409371c9d4SSatish Balay aa++; 32419371c9d4SSatish Balay aj++; 3242c87e5d42SMatthew Knepley } 3243c87e5d42SMatthew Knepley } 32449566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3247c87e5d42SMatthew Knepley } 3248c87e5d42SMatthew Knepley 3249ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3250d71ae5a4SJacob Faibussowitsch { 3251985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3252d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3253d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3254985db425SBarry Smith PetscScalar *x; 
3255ce496241SStefano Zampini const MatScalar *aa, *av; 3256985db425SBarry Smith 3257985db425SBarry Smith PetscFunctionBegin; 325828b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3260ce496241SStefano Zampini aa = av; 3261985db425SBarry Smith ai = a->i; 3262985db425SBarry Smith aj = a->j; 3263985db425SBarry Smith 32649566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32659566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 326608401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3267985db425SBarry Smith for (i = 0; i < m; i++) { 32689371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32699371c9d4SSatish Balay ai++; 3270d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32719371c9d4SSatish Balay x[i] = *aa; 32729371c9d4SSatish Balay if (idx) idx[i] = 0; 3273985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3274985db425SBarry Smith x[i] = 0.0; 3275985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3276985db425SBarry Smith for (j = 0; j < ncols; j++) { 3277985db425SBarry Smith if (aj[j] > j) { 3278985db425SBarry Smith idx[i] = j; 3279985db425SBarry Smith break; 3280985db425SBarry Smith } 3281985db425SBarry Smith } 3282fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3283fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3284985db425SBarry Smith } 3285985db425SBarry Smith } 3286985db425SBarry Smith for (j = 0; j < ncols; j++) { 32879371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32889371c9d4SSatish Balay x[i] = *aa; 32899371c9d4SSatish Balay if (idx) idx[i] = *aj; 32909371c9d4SSatish Balay } 32919371c9d4SSatish Balay aa++; 32929371c9d4SSatish Balay aj++; 3293e34fafa9SBarry Smith } 
3294e34fafa9SBarry Smith } 32959566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3298e34fafa9SBarry Smith } 3299bbead8a2SBarry Smith 3300ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3301d71ae5a4SJacob Faibussowitsch { 3302bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 330333d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3304bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 33050da83c2eSBarry Smith const PetscReal shift = 0.0; 33061a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3307bbead8a2SBarry Smith 3308bbead8a2SBarry Smith PetscFunctionBegin; 3309a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33104a0d0026SBarry Smith if (a->ibdiagvalid) { 33114a0d0026SBarry Smith if (values) *values = a->ibdiag; 33123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 33134a0d0026SBarry Smith } 33149566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 33154dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3316bbead8a2SBarry Smith diag = a->ibdiag; 3317bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3318bbead8a2SBarry Smith /* factor and invert each block */ 3319bbead8a2SBarry Smith switch (bs) { 3320bbead8a2SBarry Smith case 1: 3321bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33229566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 3323ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3324ec1892c8SHong Zhang if (allowzeropivot) { 33257b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33267b6c816cSBarry Smith 
A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33277b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33289566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 332998921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3330ec1892c8SHong Zhang } 3331bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3332bbead8a2SBarry Smith } 3333bbead8a2SBarry Smith break; 3334bbead8a2SBarry Smith case 2: 3335bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33369371c9d4SSatish Balay ij[0] = 2 * i; 33379371c9d4SSatish Balay ij[1] = 2 * i + 1; 33389566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33399566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33407b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33419566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3342bbead8a2SBarry Smith diag += 4; 3343bbead8a2SBarry Smith } 3344bbead8a2SBarry Smith break; 3345bbead8a2SBarry Smith case 3: 3346bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33479371c9d4SSatish Balay ij[0] = 3 * i; 33489371c9d4SSatish Balay ij[1] = 3 * i + 1; 33499371c9d4SSatish Balay ij[2] = 3 * i + 2; 33509566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 33527b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33539566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3354bbead8a2SBarry Smith diag += 9; 
3355bbead8a2SBarry Smith } 3356bbead8a2SBarry Smith break; 3357bbead8a2SBarry Smith case 4: 3358bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33599371c9d4SSatish Balay ij[0] = 4 * i; 33609371c9d4SSatish Balay ij[1] = 4 * i + 1; 33619371c9d4SSatish Balay ij[2] = 4 * i + 2; 33629371c9d4SSatish Balay ij[3] = 4 * i + 3; 33639566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33649566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33657b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33669566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3367bbead8a2SBarry Smith diag += 16; 3368bbead8a2SBarry Smith } 3369bbead8a2SBarry Smith break; 3370bbead8a2SBarry Smith case 5: 3371bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33729371c9d4SSatish Balay ij[0] = 5 * i; 33739371c9d4SSatish Balay ij[1] = 5 * i + 1; 33749371c9d4SSatish Balay ij[2] = 5 * i + 2; 33759371c9d4SSatish Balay ij[3] = 5 * i + 3; 33769371c9d4SSatish Balay ij[4] = 5 * i + 4; 33779566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33789566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33797b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33809566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3381bbead8a2SBarry Smith diag += 25; 3382bbead8a2SBarry Smith } 3383bbead8a2SBarry Smith break; 3384bbead8a2SBarry Smith case 6: 3385bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33869371c9d4SSatish Balay ij[0] = 6 * i; 33879371c9d4SSatish Balay ij[1] = 6 * i + 1; 33889371c9d4SSatish Balay ij[2] = 6 * i + 2; 33899371c9d4SSatish Balay ij[3] = 6 * i + 3; 33909371c9d4SSatish Balay ij[4] = 6 * i + 4; 33919371c9d4SSatish Balay ij[5] = 6 * i + 5; 33929566063dSJacob 
Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33939566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33947b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33959566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3396bbead8a2SBarry Smith diag += 36; 3397bbead8a2SBarry Smith } 3398bbead8a2SBarry Smith break; 3399bbead8a2SBarry Smith case 7: 3400bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 34019371c9d4SSatish Balay ij[0] = 7 * i; 34029371c9d4SSatish Balay ij[1] = 7 * i + 1; 34039371c9d4SSatish Balay ij[2] = 7 * i + 2; 34049371c9d4SSatish Balay ij[3] = 7 * i + 3; 34059371c9d4SSatish Balay ij[4] = 7 * i + 4; 34069371c9d4SSatish Balay ij[5] = 7 * i + 5; 3407cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 34089566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 34099566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 34107b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34119566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3412bbead8a2SBarry Smith diag += 49; 3413bbead8a2SBarry Smith } 3414bbead8a2SBarry Smith break; 3415bbead8a2SBarry Smith default: 34169566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3417bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3418ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34199566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34209566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 34217b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34229566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3423bbead8a2SBarry Smith diag += bs2; 3424bbead8a2SBarry Smith } 34259566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3426bbead8a2SBarry Smith } 3427bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 34283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3429bbead8a2SBarry Smith } 3430bbead8a2SBarry Smith 3431d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3432d71ae5a4SJacob Faibussowitsch { 343373a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3434fff043a9SJunchao Zhang PetscScalar a, *aa; 343573a71a0fSBarry Smith PetscInt m, n, i, j, col; 343673a71a0fSBarry Smith 343773a71a0fSBarry Smith PetscFunctionBegin; 343873a71a0fSBarry Smith if (!x->assembled) { 34399566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 344073a71a0fSBarry Smith for (i = 0; i < m; i++) { 344173a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34429566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 344373a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34449566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 344573a71a0fSBarry Smith } 344673a71a0fSBarry Smith } 3447e2ce353bSJunchao Zhang } else { 34489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34499566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3451e2ce353bSJunchao Zhang } 34529566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34539566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 345573a71a0fSBarry Smith } 345673a71a0fSBarry Smith 3457679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on 
columns in range of [low, high) */ 3458d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3459d71ae5a4SJacob Faibussowitsch { 3460679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3461679944adSJunchao Zhang PetscScalar a; 3462679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3463679944adSJunchao Zhang 3464679944adSJunchao Zhang PetscFunctionBegin; 3465679944adSJunchao Zhang nskip = high - low; 34669566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3467679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3468679944adSJunchao Zhang for (i = 0; i < m; i++) { 3469679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34709566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3471679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3472679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34739566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3474679944adSJunchao Zhang } 3475e2ce353bSJunchao Zhang } 34769566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34779566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3479679944adSJunchao Zhang } 3480679944adSJunchao Zhang 34810a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3482cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3483cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3484cb5b572fSBarry Smith MatMult_SeqAIJ, 348597304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34867c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34877c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3488f4259b30SLisandro Dalcin NULL, 3489f4259b30SLisandro Dalcin NULL, 3490f4259b30SLisandro Dalcin NULL, 3491f4259b30SLisandro Dalcin /* 10*/ 
NULL, 3492cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3493f4259b30SLisandro Dalcin NULL, 349441f059aeSBarry Smith MatSOR_SeqAIJ, 349591e9d3e2SHong Zhang MatTranspose_SeqAIJ, 349697304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3497cb5b572fSBarry Smith MatEqual_SeqAIJ, 3498cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3499cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3500cb5b572fSBarry Smith MatNorm_SeqAIJ, 3501f4259b30SLisandro Dalcin /* 20*/ NULL, 3502cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3503cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3504cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3505d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3506f4259b30SLisandro Dalcin NULL, 3507f4259b30SLisandro Dalcin NULL, 3508f4259b30SLisandro Dalcin NULL, 3509f4259b30SLisandro Dalcin NULL, 351026cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 3511f4259b30SLisandro Dalcin NULL, 3512f4259b30SLisandro Dalcin NULL, 3513f4259b30SLisandro Dalcin NULL, 3514f4259b30SLisandro Dalcin NULL, 3515d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3516f4259b30SLisandro Dalcin NULL, 3517f4259b30SLisandro Dalcin NULL, 3518cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3519f4259b30SLisandro Dalcin NULL, 3520d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35217dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3522cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3523cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3524cb5b572fSBarry Smith MatCopy_SeqAIJ, 3525d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3526cb5b572fSBarry Smith MatScale_SeqAIJ, 35277d68702bSBarry Smith MatShift_SeqAIJ, 352879299369SBarry Smith MatDiagonalSet_SeqAIJ, 35296e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 353073a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35313b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35323b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35333b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3534a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 353593dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 
3536f4259b30SLisandro Dalcin NULL, 3537f4259b30SLisandro Dalcin NULL, 3538cda55fadSBarry Smith MatPermute_SeqAIJ, 3539f4259b30SLisandro Dalcin NULL, 3540f4259b30SLisandro Dalcin /* 59*/ NULL, 3541b9b97703SBarry Smith MatDestroy_SeqAIJ, 3542b9b97703SBarry Smith MatView_SeqAIJ, 3543f4259b30SLisandro Dalcin NULL, 3544f4259b30SLisandro Dalcin NULL, 3545f4259b30SLisandro Dalcin /* 64*/ NULL, 3546321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3547f4259b30SLisandro Dalcin NULL, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin NULL, 3550d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3551c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3552f4259b30SLisandro Dalcin NULL, 3553f4259b30SLisandro Dalcin NULL, 3554f4259b30SLisandro Dalcin NULL, 3555f4259b30SLisandro Dalcin /* 74*/ NULL, 35563acb8795SBarry Smith MatFDColoringApply_AIJ, 3557f4259b30SLisandro Dalcin NULL, 3558f4259b30SLisandro Dalcin NULL, 3559f4259b30SLisandro Dalcin NULL, 35606ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3561f4259b30SLisandro Dalcin NULL, 3562f4259b30SLisandro Dalcin NULL, 3563f4259b30SLisandro Dalcin NULL, 3564bc011b1eSHong Zhang MatLoad_SeqAIJ, 35656cff0a6bSPierre Jolivet /* 84*/ NULL, 35666cff0a6bSPierre Jolivet NULL, 3567f4259b30SLisandro Dalcin NULL, 3568f4259b30SLisandro Dalcin NULL, 3569f4259b30SLisandro Dalcin NULL, 3570f4259b30SLisandro Dalcin /* 89*/ NULL, 3571f4259b30SLisandro Dalcin NULL, 357226be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3573f4259b30SLisandro Dalcin NULL, 3574f4259b30SLisandro Dalcin NULL, 35758fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3576f4259b30SLisandro Dalcin NULL, 3577f4259b30SLisandro Dalcin NULL, 35786fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3579f4259b30SLisandro Dalcin NULL, 35804222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3581f4259b30SLisandro Dalcin NULL, 3582f4259b30SLisandro Dalcin NULL, 358387d4246cSBarry Smith MatConjugate_SeqAIJ, 
3584f4259b30SLisandro Dalcin NULL, 3585d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 358699cafbc1SBarry Smith MatRealPart_SeqAIJ, 3587f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3588f4259b30SLisandro Dalcin NULL, 3589f4259b30SLisandro Dalcin NULL, 3590cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3591f4259b30SLisandro Dalcin NULL, 35922af78befSBarry Smith MatGetRowMin_SeqAIJ, 3593f4259b30SLisandro Dalcin NULL, 3594599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3595f4259b30SLisandro Dalcin /*114*/ NULL, 3596f4259b30SLisandro Dalcin NULL, 3597f4259b30SLisandro Dalcin NULL, 3598f4259b30SLisandro Dalcin NULL, 3599f4259b30SLisandro Dalcin NULL, 3600f4259b30SLisandro Dalcin /*119*/ NULL, 3601f4259b30SLisandro Dalcin NULL, 3602f4259b30SLisandro Dalcin NULL, 3603f4259b30SLisandro Dalcin NULL, 3604b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 36050716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3606a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 360737868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 36080da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3609f4259b30SLisandro Dalcin NULL, 3610f4259b30SLisandro Dalcin /*129*/ NULL, 3611f4259b30SLisandro Dalcin NULL, 3612f4259b30SLisandro Dalcin NULL, 361375648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3614b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3615b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36162b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3617f4259b30SLisandro Dalcin NULL, 3618f4259b30SLisandro Dalcin NULL, 36193964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3620f4259b30SLisandro Dalcin /*139*/ NULL, 3621f4259b30SLisandro Dalcin NULL, 3622f4259b30SLisandro Dalcin NULL, 36233a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36249c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36254222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36264222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 
3627f4259b30SLisandro Dalcin NULL, 362872833a62Smarkadams4 NULL, 362972833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36302d776b49SBarry Smith NULL, 3631dec0b466SHong Zhang /*150*/ MatTransposeSymbolic_SeqAIJ, 3632eede4a3fSMark Adams MatEliminateZeros_SeqAIJ, 36334cc2b5b5SPierre Jolivet MatGetRowSumAbs_SeqAIJ, 363442ce410bSJunchao Zhang NULL, 363542ce410bSJunchao Zhang NULL, 3636fe1fc275SAlexander /*155*/ NULL, 3637fe1fc275SAlexander MatCopyHashToXAIJ_Seq_Hash}; 363817ab2063SBarry Smith 3639ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3640d71ae5a4SJacob Faibussowitsch { 3641bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 364297f1f81fSBarry Smith PetscInt i, nz, n; 3643bef8e0ddSBarry Smith 3644bef8e0ddSBarry Smith PetscFunctionBegin; 3645bef8e0ddSBarry Smith nz = aij->maxnz; 3646d0f46423SBarry Smith n = mat->rmap->n; 3647ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3648bef8e0ddSBarry Smith aij->nz = nz; 3649ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 36503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3651bef8e0ddSBarry Smith } 3652bef8e0ddSBarry Smith 3653a3bb6f32SFande Kong /* 3654ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3655ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3656ddea5d60SJunchao Zhang */ 3657d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3658d71ae5a4SJacob Faibussowitsch { 3659a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3660eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3661eec179cfSJacob Faibussowitsch PetscHashIter tpos; 366225b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 366325b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3664a3bb6f32SFande Kong 3665a3bb6f32SFande Kong PetscFunctionBegin; 3666a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 36674f572ea9SToby Isaac PetscAssertPointer(mapping, 2); 3668a3bb6f32SFande Kong /* use a table */ 3669eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3670a3bb6f32SFande Kong ec = 0; 367125b670f0SStefano Zampini for (i = 0; i < nz; i++) { 367225b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3673eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3674a3bb6f32SFande Kong if (!data) { 3675a3bb6f32SFande Kong /* one based table */ 3676c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3677a3bb6f32SFande Kong } 3678a3bb6f32SFande Kong } 3679a3bb6f32SFande Kong /* form array of columns we need */ 36809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3681eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3682eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3683eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3684eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3685eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3686a3bb6f32SFande Kong gid--; 3687a3bb6f32SFande 
Kong lid--; 3688a3bb6f32SFande Kong garray[lid] = gid; 3689a3bb6f32SFande Kong } 36909566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3691eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3692c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3693a3bb6f32SFande Kong /* compact out the extra columns in B */ 369425b670f0SStefano Zampini for (i = 0; i < nz; i++) { 369525b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3696eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3697a3bb6f32SFande Kong lid--; 369825b670f0SStefano Zampini jj[i] = lid; 3699a3bb6f32SFande Kong } 37009566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3701eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 37029566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 37039566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 37049566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 37053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3706a3bb6f32SFande Kong } 3707a3bb6f32SFande Kong 3708bef8e0ddSBarry Smith /*@ 3709bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3710bef8e0ddSBarry Smith in the matrix. 
3711bef8e0ddSBarry Smith 3712bef8e0ddSBarry Smith Input Parameters: 371311a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3714bef8e0ddSBarry Smith - indices - the column indices 3715bef8e0ddSBarry Smith 371615091d37SBarry Smith Level: advanced 371715091d37SBarry Smith 3718bef8e0ddSBarry Smith Notes: 3719bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3720bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 372111a5261eSBarry Smith of the `MatSetValues()` operation. 3722bef8e0ddSBarry Smith 3723bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 372411a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3725bef8e0ddSBarry Smith 372611a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3727bef8e0ddSBarry Smith 3728b9617806SBarry Smith The indices should start with zero, not one. 3729b9617806SBarry Smith 37301cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ` 3731bef8e0ddSBarry Smith @*/ 3732d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3733d71ae5a4SJacob Faibussowitsch { 3734bef8e0ddSBarry Smith PetscFunctionBegin; 37350700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 37364f572ea9SToby Isaac PetscAssertPointer(indices, 2); 3737cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 37383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3739bef8e0ddSBarry Smith } 3740bef8e0ddSBarry Smith 3741ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3742d71ae5a4SJacob Faibussowitsch { 3743be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3744d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3745be6bf707SBarry Smith 3746be6bf707SBarry Smith PetscFunctionBegin; 374728b400f6SJacob Faibussowitsch 
PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3748be6bf707SBarry Smith 3749be6bf707SBarry Smith /* allocate space for values if not already there */ 37504dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3751be6bf707SBarry Smith 3752be6bf707SBarry Smith /* copy values over */ 37539566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 37543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3755be6bf707SBarry Smith } 3756be6bf707SBarry Smith 3757be6bf707SBarry Smith /*@ 375820f4b53cSBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the 3759be6bf707SBarry Smith nonlinear portion. 3760be6bf707SBarry Smith 3761c3339decSBarry Smith Logically Collect 3762be6bf707SBarry Smith 376327430b45SBarry Smith Input Parameter: 376411a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3765be6bf707SBarry Smith 376615091d37SBarry Smith Level: advanced 376715091d37SBarry Smith 37682920cce0SJacob Faibussowitsch Example Usage: 376927430b45SBarry Smith .vb 37702ef1f0ffSBarry Smith Using SNES 377127430b45SBarry Smith Create Jacobian matrix 377227430b45SBarry Smith Set linear terms into matrix 377327430b45SBarry Smith Apply boundary conditions to matrix, at this time matrix must have 377427430b45SBarry Smith final nonzero structure (i.e. 
setting the nonlinear terms and applying 377527430b45SBarry Smith boundary conditions again will not change the nonzero structure 377627430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 377727430b45SBarry Smith MatStoreValues(mat); 377827430b45SBarry Smith Call SNESSetJacobian() with matrix 377927430b45SBarry Smith In your Jacobian routine 378027430b45SBarry Smith MatRetrieveValues(mat); 378127430b45SBarry Smith Set nonlinear terms in matrix 3782be6bf707SBarry Smith 378327430b45SBarry Smith Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself: 378427430b45SBarry Smith // build linear portion of Jacobian 378527430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 378627430b45SBarry Smith MatStoreValues(mat); 378727430b45SBarry Smith loop over nonlinear iterations 378827430b45SBarry Smith MatRetrieveValues(mat); 378927430b45SBarry Smith // call MatSetValues(mat,...) to set nonliner portion of Jacobian 379027430b45SBarry Smith // call MatAssemblyBegin/End() on matrix 379127430b45SBarry Smith Solve linear system with Jacobian 379227430b45SBarry Smith endloop 379327430b45SBarry Smith .ve 3794be6bf707SBarry Smith 3795be6bf707SBarry Smith Notes: 3796da81f932SPierre Jolivet Matrix must already be assembled before calling this routine 379711a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3798be6bf707SBarry Smith calling this routine. 3799be6bf707SBarry Smith 38000c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 38010c468ba9SBarry Smith and does not allocated additional space. 
38020c468ba9SBarry Smith 3803fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()` 3804be6bf707SBarry Smith @*/ 3805d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3806d71ae5a4SJacob Faibussowitsch { 3807be6bf707SBarry Smith PetscFunctionBegin; 38080700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 380928b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 381028b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3811cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 38123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3813be6bf707SBarry Smith } 3814be6bf707SBarry Smith 3815ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3816d71ae5a4SJacob Faibussowitsch { 3817be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3818d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3819be6bf707SBarry Smith 3820be6bf707SBarry Smith PetscFunctionBegin; 382128b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 382228b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3823be6bf707SBarry Smith /* copy values over */ 38249566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 38253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3826be6bf707SBarry Smith } 3827be6bf707SBarry Smith 3828be6bf707SBarry Smith /*@ 382920f4b53cSBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()` 3830be6bf707SBarry Smith 3831c3339decSBarry Smith Logically Collect 3832be6bf707SBarry Smith 38332fe279fdSBarry Smith 
Input Parameter: 383411a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3835be6bf707SBarry Smith 383615091d37SBarry Smith Level: advanced 383715091d37SBarry Smith 38381cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()` 3839be6bf707SBarry Smith @*/ 3840d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3841d71ae5a4SJacob Faibussowitsch { 3842be6bf707SBarry Smith PetscFunctionBegin; 38430700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 384428b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 384528b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3846cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 38473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3848be6bf707SBarry Smith } 3849be6bf707SBarry Smith 38505d83a8b1SBarry Smith /*@ 385111a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 38520d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 385320f4b53cSBarry Smith the user should preallocate the matrix storage by setting the parameter `nz` 385420f4b53cSBarry Smith (or the array `nnz`). 385517ab2063SBarry Smith 3856d083f849SBarry Smith Collective 3857db81eaa0SLois Curfman McInnes 385817ab2063SBarry Smith Input Parameters: 385911a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 386017ab2063SBarry Smith . m - number of rows 386117ab2063SBarry Smith . n - number of columns 386217ab2063SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 386351c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38640298fd71SBarry Smith (possibly different for each row) or NULL 386517ab2063SBarry Smith 386617ab2063SBarry Smith Output Parameter: 3867416022c9SBarry Smith . A - the matrix 386817ab2063SBarry Smith 38692ef1f0ffSBarry Smith Options Database Keys: 38702ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 38712ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 38722ef1f0ffSBarry Smith 38732ef1f0ffSBarry Smith Level: intermediate 3874175b88e8SBarry Smith 3875b259b22eSLois Curfman McInnes Notes: 387677433607SBarry Smith It is recommend to use `MatCreateFromOptions()` instead of this routine 387777433607SBarry Smith 38782ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 387949a6f317SBarry Smith 38802ef1f0ffSBarry Smith The `MATSEQAIJ` format, also called 38812ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 38820002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 38832ef1f0ffSBarry Smith either one (as in Fortran) or zero. 388417ab2063SBarry Smith 388520f4b53cSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 38862ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 388720f4b53cSBarry Smith allocation. 388817ab2063SBarry Smith 3889682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38904fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3891682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38926c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 
38936c7ebb05SLois Curfman McInnes 38941cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 389517ab2063SBarry Smith @*/ 3896d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3897d71ae5a4SJacob Faibussowitsch { 38983a40ed3dSBarry Smith PetscFunctionBegin; 38999566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 39009566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 39019566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 39029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 39033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3904273d9f13SBarry Smith } 3905273d9f13SBarry Smith 39065d83a8b1SBarry Smith /*@ 3907273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3908273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3909273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3910273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3911273d9f13SBarry Smith 3912d083f849SBarry Smith Collective 3913273d9f13SBarry Smith 3914273d9f13SBarry Smith Input Parameters: 39151c4f3114SJed Brown + B - The matrix 3916273d9f13SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 3917273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 39180298fd71SBarry Smith (possibly different for each row) or NULL 3919273d9f13SBarry Smith 39202ef1f0ffSBarry Smith Options Database Keys: 39212ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 39222ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 39232ef1f0ffSBarry Smith 39242ef1f0ffSBarry Smith Level: intermediate 39252ef1f0ffSBarry Smith 3926273d9f13SBarry Smith Notes: 39272ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 392849a6f317SBarry Smith 392911a5261eSBarry Smith The `MATSEQAIJ` format also called 39302ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 3931273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3932273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3933273d9f13SBarry Smith 39342ef1f0ffSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 39352ef1f0ffSBarry Smith Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 39362ef1f0ffSBarry Smith allocation. 3937273d9f13SBarry Smith 393811a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3939aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3940aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3941aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3942aa95bbe8SBarry Smith 394311a5261eSBarry Smith Developer Notes: 394411a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3945a96a251dSBarry Smith entries or columns indices 3946a96a251dSBarry Smith 3947273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3948273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3949273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3950273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3951273d9f13SBarry Smith 39521cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3953db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3954273d9f13SBarry Smith @*/ 3955d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3956d71ae5a4SJacob Faibussowitsch { 3957a23d5eceSKris Buschelman PetscFunctionBegin; 39586ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39596ba663aaSJed Brown PetscValidType(B, 1); 3960cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 39613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3962a23d5eceSKris Buschelman } 3963a23d5eceSKris Buschelman 3964d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3965d71ae5a4SJacob Faibussowitsch { 3966ad79cf63SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 39672576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE; 396897f1f81fSBarry Smith PetscInt i; 3969273d9f13SBarry Smith 3970273d9f13SBarry Smith PetscFunctionBegin; 3971ad79cf63SBarry Smith if (B->hash_active) { 3972aea10558SJacob Faibussowitsch B->ops[0] = 
b->cops; 3973ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3974ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3975ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3976ad79cf63SBarry Smith } 39772576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3978a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3979c461c341SBarry Smith skipallocation = PETSC_TRUE; 3980c461c341SBarry Smith nz = 0; 3981c461c341SBarry Smith } 39829566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39839566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3984899cda47SBarry Smith 3985435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 398608401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 39879f0612e4SBarry Smith if (nnz) { 3988d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 398908401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 399008401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3991b73539f3SBarry Smith } 3992b73539f3SBarry Smith } 3993b73539f3SBarry Smith 3994273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3995ab93d7beSBarry Smith if (!skipallocation) { 39964dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3997071fcb05SBarry Smith if (!b->ilen) { 3998071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39999566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 4000071fcb05SBarry Smith } else { 40019566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 40022ee49352SLisandro Dalcin } 4003aa624791SPierre Jolivet if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); 4004273d9f13SBarry Smith if (!nnz) { 4005435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 4006c62bd62aSJed Brown else if (nz < 0) nz = 1; 40075d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 4008d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 4009c43c4a61SBarry Smith PetscCall(PetscIntMultError(nz, B->rmap->n, &nz)); 4010273d9f13SBarry Smith } else { 4011c73702f5SBarry Smith PetscInt64 nz64 = 0; 40129371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 40139371c9d4SSatish Balay b->imax[i] = nnz[i]; 40149371c9d4SSatish Balay nz64 += nnz[i]; 40159371c9d4SSatish Balay } 40169566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 4017273d9f13SBarry Smith } 4018ab93d7beSBarry Smith 4019273d9f13SBarry Smith /* allocate the matrix space */ 40209566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 40219f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscInt), (void **)&b->j)); 40229f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(B->rmap->n + 1, sizeof(PetscInt), (void **)&b->i)); 40239f0612e4SBarry Smith b->free_ij = PETSC_TRUE; 4024396832f4SHong Zhang if (B->structure_only) { 40259f0612e4SBarry Smith b->free_a = PETSC_FALSE; 4026396832f4SHong Zhang } else { 40279f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscScalar), (void **)&b->a)); 40289f0612e4SBarry Smith b->free_a = PETSC_TRUE; 4029396832f4SHong Zhang } 4030bfeeae90SHong Zhang b->i[0] = 0; 4031ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4032c461c341SBarry Smith } else { 
4033e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4034e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4035c461c341SBarry Smith } 4036273d9f13SBarry Smith 4037846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4038846b4da1SFande Kong /* reserve user-requested sparsity */ 40399566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4040846b4da1SFande Kong } 4041846b4da1SFande Kong 4042273d9f13SBarry Smith b->nz = 0; 4043273d9f13SBarry Smith b->maxnz = nz; 4044273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40451baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4046cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4047cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40485519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40495519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 40505519a089SJose E. Roman */ 40515519a089SJose E. Roman B->nonzerostate++; 40523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4053273d9f13SBarry Smith } 4054273d9f13SBarry Smith 4055ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4056d71ae5a4SJacob Faibussowitsch { 4057846b4da1SFande Kong Mat_SeqAIJ *a; 4058a5bbaf83SFande Kong PetscInt i; 40591f14be2bSBarry Smith PetscBool skipreset; 4060846b4da1SFande Kong 4061846b4da1SFande Kong PetscFunctionBegin; 4062846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 406314d0e64fSAlex Lindsay 406414d0e64fSAlex Lindsay /* Check local size. 
If zero, then return */ 40653ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 406614d0e64fSAlex Lindsay 4067846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40682c814fdeSFande Kong /* if no saved info, we error out */ 406928b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40702c814fdeSFande Kong 40711f14be2bSBarry Smith PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40722c814fdeSFande Kong 40731f14be2bSBarry Smith PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset)); 40741f14be2bSBarry Smith if (!skipreset) { 40759566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40769566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4077846b4da1SFande Kong a->i[0] = 0; 4078ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4079846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4080846b4da1SFande Kong a->nz = 0; 4081846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4082846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4083846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4084846b4da1SFande Kong A->assembled = PETSC_FALSE; 40851f14be2bSBarry Smith } 40863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4087846b4da1SFande Kong } 4088846b4da1SFande Kong 408958d36128SBarry Smith /*@ 409011a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4091a1661176SMatthew Knepley 4092a1661176SMatthew Knepley Input Parameters: 4093a1661176SMatthew Knepley + B - the matrix 4094d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero) 4095d8a51d2aSBarry Smith . 
j - the column indices for each row (indices start with zero) these must be sorted for each row 4096d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided 4097a1661176SMatthew Knepley 4098a1661176SMatthew Knepley Level: developer 4099a1661176SMatthew Knepley 41006a9b8d82SBarry Smith Notes: 41012ef1f0ffSBarry Smith The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 410258d36128SBarry Smith 41036a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 41046a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 41056a9b8d82SBarry Smith 41066a9b8d82SBarry Smith Developer Notes: 41072ef1f0ffSBarry Smith An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and 41082ef1f0ffSBarry Smith then just copies the `v` values directly with `PetscMemcpy()`. 41096a9b8d82SBarry Smith 411011a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
41116a9b8d82SBarry Smith 4112fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()` 4113a1661176SMatthew Knepley @*/ 4114d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4115d71ae5a4SJacob Faibussowitsch { 4116a1661176SMatthew Knepley PetscFunctionBegin; 41170700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41186ba663aaSJed Brown PetscValidType(B, 1); 4119cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 41203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4121a1661176SMatthew Knepley } 4122a1661176SMatthew Knepley 4123ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4124d71ae5a4SJacob Faibussowitsch { 4125a1661176SMatthew Knepley PetscInt i; 4126a1661176SMatthew Knepley PetscInt m, n; 4127a1661176SMatthew Knepley PetscInt nz; 41286a9b8d82SBarry Smith PetscInt *nnz; 4129a1661176SMatthew Knepley 4130a1661176SMatthew Knepley PetscFunctionBegin; 4131aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4132779a8d59SSatish Balay 41339566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41349566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4135779a8d59SSatish Balay 41369566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41379566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4138a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4139b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 414008401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, 
"Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4141a1661176SMatthew Knepley nnz[i] = nz; 4142a1661176SMatthew Knepley } 41439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41449566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4145a1661176SMatthew Knepley 41468e3a54c0SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES)); 4147a1661176SMatthew Knepley 41489566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41499566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4150a1661176SMatthew Knepley 41519566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 41523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4153a1661176SMatthew Knepley } 4154a1661176SMatthew Knepley 4155ad7e164aSPierre Jolivet /*@ 41562ef1f0ffSBarry Smith MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`. 4157ad7e164aSPierre Jolivet 4158ad7e164aSPierre Jolivet Input Parameters: 4159ad7e164aSPierre Jolivet + A - left-hand side matrix 4160ad7e164aSPierre Jolivet . B - right-hand side matrix 416111a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4162ad7e164aSPierre Jolivet 4163ad7e164aSPierre Jolivet Output Parameter: 41642ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B` 4165ad7e164aSPierre Jolivet 4166ad7e164aSPierre Jolivet Level: intermediate 4167ad7e164aSPierre Jolivet 416811a5261eSBarry Smith Note: 416911a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4170ad7e164aSPierre Jolivet 41711cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4172ad7e164aSPierre Jolivet @*/ 4173d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4174d71ae5a4SJacob Faibussowitsch { 4175ad7e164aSPierre Jolivet PetscFunctionBegin; 4176ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4177ad7e164aSPierre Jolivet PetscValidType(A, 1); 4178ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4179ad7e164aSPierre Jolivet PetscValidType(B, 2); 41804f572ea9SToby Isaac PetscAssertPointer(C, 4); 4181ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4182ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4183ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4184ad7e164aSPierre Jolivet } 4185cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 41863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4187ad7e164aSPierre Jolivet } 4188ad7e164aSPierre Jolivet 4189ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4190d71ae5a4SJacob Faibussowitsch { 4191ad7e164aSPierre Jolivet Mat newmat; 4192ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4193ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4194ad7e164aSPierre Jolivet PetscScalar *v; 4195fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4196ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4197ad7e164aSPierre Jolivet PetscBool flg; 4198ad7e164aSPierre Jolivet 4199ad7e164aSPierre Jolivet PetscFunctionBegin; 420028b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 420128b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 420228b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 420328b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 42049566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 420528b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4206aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4207ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42089566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 42099566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 42109566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 42119566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4212ad7e164aSPierre Jolivet i[0] = 0; 4213ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4214ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4215ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4216ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4217ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4218ad7e164aSPierre Jolivet } 4219ad7e164aSPierre Jolivet } 4220ad7e164aSPierre Jolivet } 42219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4222ad7e164aSPierre Jolivet *C = newmat; 42239566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4224ad7e164aSPierre Jolivet nnz = 0; 4225ad7e164aSPierre Jolivet } 42269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 
42279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4229ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4230ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4231ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4232ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4233ad7e164aSPierre Jolivet } 4234ad7e164aSPierre Jolivet } 4235ad7e164aSPierre Jolivet } 42369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 42393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4240ad7e164aSPierre Jolivet } 4241ad7e164aSPierre Jolivet 4242c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4243af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4244170fe5c8SBarry Smith 4245170fe5c8SBarry Smith /* 4246170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4247170fe5c8SBarry Smith 4248170fe5c8SBarry Smith n p p 42492da392ccSBarry Smith [ ] [ ] [ ] 42502da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42512da392ccSBarry Smith [ ] [ ] [ ] 4252170fe5c8SBarry Smith 4253170fe5c8SBarry Smith */ 4254d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4255d71ae5a4SJacob Faibussowitsch { 4256170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4257170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4258170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 425986214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4260170fe5c8SBarry Smith const PetscInt *ii, *idx; 4261170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4262170fe5c8SBarry Smith PetscScalar *c, *c_q; 426386214ceeSStefano Zampini PetscInt clda 
= sub_c->lda; 426486214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4265170fe5c8SBarry Smith 4266170fe5c8SBarry Smith PetscFunctionBegin; 4267d0f46423SBarry Smith m = A->rmap->n; 4268d0f46423SBarry Smith n = A->cmap->n; 4269d0f46423SBarry Smith p = B->cmap->n; 4270170fe5c8SBarry Smith a = sub_a->v; 4271170fe5c8SBarry Smith b = sub_b->a; 4272170fe5c8SBarry Smith c = sub_c->v; 427386214ceeSStefano Zampini if (clda == m) { 42749566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 427586214ceeSStefano Zampini } else { 427686214ceeSStefano Zampini for (j = 0; j < p; j++) 42779371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 427886214ceeSStefano Zampini } 4279170fe5c8SBarry Smith ii = sub_b->i; 4280170fe5c8SBarry Smith idx = sub_b->j; 4281170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4282170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4283170fe5c8SBarry Smith while (q-- > 0) { 428486214ceeSStefano Zampini c_q = c + clda * (*idx); 428586214ceeSStefano Zampini a_q = a + alda * i; 4286854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4287170fe5c8SBarry Smith idx++; 4288170fe5c8SBarry Smith b++; 4289170fe5c8SBarry Smith } 4290170fe5c8SBarry Smith } 42913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4292170fe5c8SBarry Smith } 4293170fe5c8SBarry Smith 4294d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4295d71ae5a4SJacob Faibussowitsch { 4296d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 429786214ceeSStefano Zampini PetscBool cisdense; 4298170fe5c8SBarry Smith 4299170fe5c8SBarry Smith PetscFunctionBegin; 430008401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 43019566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 43029566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 
4303d5e393b6SSuyash Tandon PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 430448a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 43059566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4306d73949e8SHong Zhang 43074222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 43083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4309170fe5c8SBarry Smith } 4310170fe5c8SBarry Smith 43110bad9183SKris Buschelman /*MC 4312fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43130bad9183SKris Buschelman based on compressed sparse row format. 43140bad9183SKris Buschelman 43152ef1f0ffSBarry Smith Options Database Key: 43160bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43170bad9183SKris Buschelman 43180bad9183SKris Buschelman Level: beginner 43190bad9183SKris Buschelman 43200cd7f59aSBarry Smith Notes: 43212ef1f0ffSBarry Smith `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values, 43220cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43230cd7f59aSBarry Smith in the matrix 43240cd7f59aSBarry Smith 432511a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored

   Developer Note:
    It would be nice if all matrix formats supported passing `NULL` in for the numerical values

.seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
   and `MATMPIAIJ` otherwise. As a result, for single process communicators,
   `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes. It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Key:
. -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`

   Level: beginner

   Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when
   enough exist.
4351ccd284c7SBarry Smith 43521cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4353ccd284c7SBarry Smith M*/ 4354ccd284c7SBarry Smith 4355ccd284c7SBarry Smith /*MC 4356ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4357ccd284c7SBarry Smith 43582ef1f0ffSBarry Smith Options Database Key: 43592ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 43602ef1f0ffSBarry Smith 43612ef1f0ffSBarry Smith Level: beginner 43622ef1f0ffSBarry Smith 43632ef1f0ffSBarry Smith Note: 436411a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 436511a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 436611a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4367ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4368ccd284c7SBarry Smith the above preallocation routines for simplicity. 4369ccd284c7SBarry Smith 43701cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4371ccd284c7SBarry Smith M*/ 4372ccd284c7SBarry Smith 43737906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43747906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43757906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43767906f579SHong Zhang #endif 4377d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4378d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4379d24d4204SJose E. 
Roman #endif 43807906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43817906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43827906f579SHong Zhang #endif 43837906f579SHong Zhang 4384d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4385c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43864222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43877906f579SHong Zhang 43888c778c55SBarry Smith /*@C 438911a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43908c778c55SBarry Smith 43918c778c55SBarry Smith Not Collective 43928c778c55SBarry Smith 43938c778c55SBarry Smith Input Parameter: 4394fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 43958c778c55SBarry Smith 43968c778c55SBarry Smith Output Parameter: 43978c778c55SBarry Smith . 
array - pointer to the data 43988c778c55SBarry Smith 43998c778c55SBarry Smith Level: intermediate 44008c778c55SBarry Smith 4401fe59aa6dSJacob Faibussowitsch Fortran Notes: 44020ab4885dSBarry Smith `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()` 44030ab4885dSBarry Smith 44041cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 44058c778c55SBarry Smith @*/ 44065d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[]) 4407d71ae5a4SJacob Faibussowitsch { 4408d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44098c778c55SBarry Smith 44108c778c55SBarry Smith PetscFunctionBegin; 4411d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44129566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4413d67d9f35SJunchao Zhang } else { 4414d67d9f35SJunchao Zhang *array = aij->a; 4415d67d9f35SJunchao Zhang } 44163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4417d67d9f35SJunchao Zhang } 4418d67d9f35SJunchao Zhang 4419d67d9f35SJunchao Zhang /*@C 442011a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4421d67d9f35SJunchao Zhang 4422d67d9f35SJunchao Zhang Not Collective 4423d67d9f35SJunchao Zhang 4424d67d9f35SJunchao Zhang Input Parameters: 4425fe59aa6dSJacob Faibussowitsch + A - a `MATSEQAIJ` matrix 4426d67d9f35SJunchao Zhang - array - pointer to the data 4427d67d9f35SJunchao Zhang 4428d67d9f35SJunchao Zhang Level: intermediate 4429d67d9f35SJunchao Zhang 4430fe59aa6dSJacob Faibussowitsch Fortran Notes: 44310ab4885dSBarry Smith `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()` 44320ab4885dSBarry Smith 44331cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4434d67d9f35SJunchao Zhang @*/ 
44355d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[]) 4436d71ae5a4SJacob Faibussowitsch { 4437d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4438d67d9f35SJunchao Zhang 4439d67d9f35SJunchao Zhang PetscFunctionBegin; 4440d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44419566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4442d67d9f35SJunchao Zhang } else { 4443d67d9f35SJunchao Zhang *array = NULL; 4444d67d9f35SJunchao Zhang } 44459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44469566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44488c778c55SBarry Smith } 44498c778c55SBarry Smith 445021e72a00SBarry Smith /*@C 445111a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44528f1ea47aSStefano Zampini 44530ab4885dSBarry Smith Not Collective; No Fortran Support 44548f1ea47aSStefano Zampini 44558f1ea47aSStefano Zampini Input Parameter: 4456fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44578f1ea47aSStefano Zampini 44588f1ea47aSStefano Zampini Output Parameter: 44598f1ea47aSStefano Zampini . 
array - pointer to the data 44608f1ea47aSStefano Zampini 44618f1ea47aSStefano Zampini Level: intermediate 44628f1ea47aSStefano Zampini 44631cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44648f1ea47aSStefano Zampini @*/ 44655d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[]) 4466d71ae5a4SJacob Faibussowitsch { 4467d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44688f1ea47aSStefano Zampini 44698f1ea47aSStefano Zampini PetscFunctionBegin; 4470d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44719566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4472d67d9f35SJunchao Zhang } else { 4473d67d9f35SJunchao Zhang *array = aij->a; 4474d67d9f35SJunchao Zhang } 44753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44768f1ea47aSStefano Zampini } 44778f1ea47aSStefano Zampini 44788f1ea47aSStefano Zampini /*@C 447911a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44808f1ea47aSStefano Zampini 44810ab4885dSBarry Smith Not Collective; No Fortran Support 44828f1ea47aSStefano Zampini 44838f1ea47aSStefano Zampini Input Parameter: 4484fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44858f1ea47aSStefano Zampini 44868f1ea47aSStefano Zampini Output Parameter: 44878f1ea47aSStefano Zampini . 
array - pointer to the data 44888f1ea47aSStefano Zampini 44898f1ea47aSStefano Zampini Level: intermediate 44908f1ea47aSStefano Zampini 44911cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44928f1ea47aSStefano Zampini @*/ 44935d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[]) 4494d71ae5a4SJacob Faibussowitsch { 4495d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44968f1ea47aSStefano Zampini 44978f1ea47aSStefano Zampini PetscFunctionBegin; 4498d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44999566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4500d67d9f35SJunchao Zhang } else { 4501d67d9f35SJunchao Zhang *array = NULL; 4502d67d9f35SJunchao Zhang } 45033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4504d67d9f35SJunchao Zhang } 4505d67d9f35SJunchao Zhang 4506d67d9f35SJunchao Zhang /*@C 450711a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4508d67d9f35SJunchao Zhang 45090ab4885dSBarry Smith Not Collective; No Fortran Support 4510d67d9f35SJunchao Zhang 4511d67d9f35SJunchao Zhang Input Parameter: 4512fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 4513d67d9f35SJunchao Zhang 4514d67d9f35SJunchao Zhang Output Parameter: 4515d67d9f35SJunchao Zhang . 
array - pointer to the data 4516d67d9f35SJunchao Zhang 4517d67d9f35SJunchao Zhang Level: intermediate 4518d67d9f35SJunchao Zhang 45191cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4520d67d9f35SJunchao Zhang @*/ 45215d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[]) 4522d71ae5a4SJacob Faibussowitsch { 4523d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4524d67d9f35SJunchao Zhang 4525d67d9f35SJunchao Zhang PetscFunctionBegin; 4526d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45279566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4528d67d9f35SJunchao Zhang } else { 4529d67d9f35SJunchao Zhang *array = aij->a; 4530d67d9f35SJunchao Zhang } 45319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45329566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 45333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4534d67d9f35SJunchao Zhang } 4535d67d9f35SJunchao Zhang 4536d67d9f35SJunchao Zhang /*@C 4537d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4538d67d9f35SJunchao Zhang 45390ab4885dSBarry Smith Not Collective; No Fortran Support 4540d67d9f35SJunchao Zhang 4541d67d9f35SJunchao Zhang Input Parameter: 4542fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix 4543d67d9f35SJunchao Zhang 4544d67d9f35SJunchao Zhang Output Parameter: 4545d67d9f35SJunchao Zhang . 
array - pointer to the data 4546d67d9f35SJunchao Zhang 4547d67d9f35SJunchao Zhang Level: intermediate 4548d67d9f35SJunchao Zhang 45491cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4550d67d9f35SJunchao Zhang @*/ 45515d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[]) 4552d71ae5a4SJacob Faibussowitsch { 4553d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4554d67d9f35SJunchao Zhang 4555d67d9f35SJunchao Zhang PetscFunctionBegin; 4556d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45579566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4558d67d9f35SJunchao Zhang } else { 4559d67d9f35SJunchao Zhang *array = NULL; 4560d67d9f35SJunchao Zhang } 45613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45628f1ea47aSStefano Zampini } 45638f1ea47aSStefano Zampini 45648f1ea47aSStefano Zampini /*@C 456511a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45667ee59b9bSJunchao Zhang 45670ab4885dSBarry Smith Not Collective; No Fortran Support 45687ee59b9bSJunchao Zhang 45697ee59b9bSJunchao Zhang Input Parameter: 457011a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45717ee59b9bSJunchao Zhang 45727ee59b9bSJunchao Zhang Output Parameters: 45737ee59b9bSJunchao Zhang + i - row map array of the matrix 45747ee59b9bSJunchao Zhang . j - column index array of the matrix 45757ee59b9bSJunchao Zhang . a - data array of the matrix 4576fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays 45777ee59b9bSJunchao Zhang 4578fe59aa6dSJacob Faibussowitsch Level: developer 45792ef1f0ffSBarry Smith 45807ee59b9bSJunchao Zhang Notes: 45812ef1f0ffSBarry Smith Any of the output parameters can be `NULL`, in which case the corresponding value is not returned. 45827ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. 
Otherwise, they are on the host. 45837ee59b9bSJunchao Zhang 45847ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45852ef1f0ffSBarry Smith If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix. 45867ee59b9bSJunchao Zhang 45871cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45887ee59b9bSJunchao Zhang @*/ 45895d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype) 4590d71ae5a4SJacob Faibussowitsch { 45917ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45927ee59b9bSJunchao Zhang 45937ee59b9bSJunchao Zhang PetscFunctionBegin; 45947ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45957ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45967ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45977ee59b9bSJunchao Zhang } else { 45987ee59b9bSJunchao Zhang if (i) *i = aij->i; 45997ee59b9bSJunchao Zhang if (j) *j = aij->j; 46007ee59b9bSJunchao Zhang if (a) *a = aij->a; 46017ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 46027ee59b9bSJunchao Zhang } 46033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 46047ee59b9bSJunchao Zhang } 46057ee59b9bSJunchao Zhang 4606cc4c1da9SBarry Smith /*@ 460721e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 460821e72a00SBarry Smith 460921e72a00SBarry Smith Not Collective 461021e72a00SBarry Smith 461121e72a00SBarry Smith Input Parameter: 4612fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 461321e72a00SBarry Smith 461421e72a00SBarry Smith Output Parameter: 461521e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 461621e72a00SBarry Smith 461721e72a00SBarry Smith Level: intermediate 461821e72a00SBarry Smith 46191cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 462021e72a00SBarry Smith @*/ 4621d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4622d71ae5a4SJacob Faibussowitsch { 462321e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 462421e72a00SBarry Smith 462521e72a00SBarry Smith PetscFunctionBegin; 462621e72a00SBarry Smith *nz = aij->rmax; 46273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 462821e72a00SBarry Smith } 462921e72a00SBarry Smith 463049abdd8aSBarry Smith static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void **data) 46312c4ab24aSJunchao Zhang { 463249abdd8aSBarry Smith MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)*data; 46334d86920dSPierre Jolivet 46342c4ab24aSJunchao Zhang PetscFunctionBegin; 46352c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->perm)); 46362c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->jmap)); 46372c4ab24aSJunchao Zhang PetscCall(PetscFree(coo)); 46382c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 46392c4ab24aSJunchao Zhang } 46402c4ab24aSJunchao Zhang 4641d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4642d71ae5a4SJacob Faibussowitsch { 4643394ed5ebSJunchao Zhang MPI_Comm comm; 4644394ed5ebSJunchao Zhang PetscInt *i, *j; 46450d88f7f4SJunchao Zhang PetscInt M, N, row, iprev; 4646394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4647394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4648394ed5ebSJunchao Zhang PetscInt *Aj; 4649394ed5ebSJunchao Zhang PetscScalar *Aa; 4650f4f49eeaSPierre Jolivet Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)mat->data; 
4651cbc6b225SStefano Zampini MatType rtype; 4652394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 46532c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 46540d88f7f4SJunchao Zhang PetscBool isorted; 46559f0612e4SBarry Smith PetscBool hypre; 46569f0612e4SBarry Smith const char *name; 4657394ed5ebSJunchao Zhang 4658394ed5ebSJunchao Zhang PetscFunctionBegin; 46599566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46609566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4661e8729f6fSJunchao Zhang i = coo_i; 4662e8729f6fSJunchao Zhang j = coo_j; 46639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 46640d88f7f4SJunchao Zhang 46650d88f7f4SJunchao Zhang /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */ 46660d88f7f4SJunchao Zhang isorted = PETSC_TRUE; 46670d88f7f4SJunchao Zhang iprev = PETSC_INT_MIN; 46680d88f7f4SJunchao Zhang for (k = 0; k < coo_n; k++) { 4669394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 46700d88f7f4SJunchao Zhang if (isorted) { 46710d88f7f4SJunchao Zhang if (i[k] < iprev) isorted = PETSC_FALSE; 46720d88f7f4SJunchao Zhang else iprev = i[k]; 46730d88f7f4SJunchao Zhang } 4674394ed5ebSJunchao Zhang perm[k] = k; 4675394ed5ebSJunchao Zhang } 4676394ed5ebSJunchao Zhang 46770d88f7f4SJunchao Zhang /* Sort by row if not already */ 46780d88f7f4SJunchao Zhang if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 4679651b1cf9SStefano Zampini 4680651b1cf9SStefano Zampini /* Advance k to the first row with a non-negative index */ 4681651b1cf9SStefano Zampini for (k = 0; k < coo_n; k++) 46829371c9d4SSatish Balay if (i[k] >= 0) break; 4683394ed5ebSJunchao Zhang nneg = k; 46849566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. 
jmap[i] originally is the number of repeats for i-th nonzero */ 4685394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 468635cb6cd3SPierre Jolivet jmap++; /* Inc jmap by 1 for convenience */ 4687394ed5ebSJunchao Zhang 46889f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(M + 1, sizeof(PetscInt), (void **)&Ai)); /* CSR of A */ 46899f0612e4SBarry Smith PetscCall(PetscArrayzero(Ai, M + 1)); 46909f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(coo_n - nneg, sizeof(PetscInt), (void **)&Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4691394ed5ebSJunchao Zhang 4692651b1cf9SStefano Zampini PetscCall(PetscObjectGetName((PetscObject)mat, &name)); 4693651b1cf9SStefano Zampini PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre)); 4694651b1cf9SStefano Zampini 4695394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 469635cb6cd3SPierre Jolivet Ai++; /* Inc by 1 for convenience */ 4697394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4698394ed5ebSJunchao Zhang while (k < coo_n) { 46990d88f7f4SJunchao Zhang PetscBool strictly_sorted; // this row is strictly sorted? 
47000d88f7f4SJunchao Zhang PetscInt jprev; 47010d88f7f4SJunchao Zhang 47020d88f7f4SJunchao Zhang /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */ 4703394ed5ebSJunchao Zhang row = i[k]; 47040d88f7f4SJunchao Zhang start = k; 47050d88f7f4SJunchao Zhang jprev = PETSC_INT_MIN; 47060d88f7f4SJunchao Zhang strictly_sorted = PETSC_TRUE; 47070d88f7f4SJunchao Zhang while (k < coo_n && i[k] == row) { 47080d88f7f4SJunchao Zhang if (strictly_sorted) { 47090d88f7f4SJunchao Zhang if (j[k] <= jprev) strictly_sorted = PETSC_FALSE; 47100d88f7f4SJunchao Zhang else jprev = j[k]; 47110d88f7f4SJunchao Zhang } 47120d88f7f4SJunchao Zhang k++; 47130d88f7f4SJunchao Zhang } 4714394ed5ebSJunchao Zhang end = k; 47150d88f7f4SJunchao Zhang 4716651b1cf9SStefano Zampini /* hack for HYPRE: swap min column to diag so that diagonal values will go first */ 4717651b1cf9SStefano Zampini if (hypre) { 47181690c2aeSBarry Smith PetscInt minj = PETSC_INT_MAX; 4719651b1cf9SStefano Zampini PetscBool hasdiag = PETSC_FALSE; 47200d88f7f4SJunchao Zhang 47210d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to swap the first and the diag 47220d88f7f4SJunchao Zhang PetscCount tmp; 47230d88f7f4SJunchao Zhang for (p = start; p < end; p++) { 47240d88f7f4SJunchao Zhang if (j[p] == row && p != start) { 47251c265611SJunchao Zhang j[p] = j[start]; // swap j[], so that the diagonal value will go first (manipulated by perm[]) 47260d88f7f4SJunchao Zhang j[start] = row; 47270d88f7f4SJunchao Zhang tmp = perm[start]; 47281c265611SJunchao Zhang perm[start] = perm[p]; // also swap perm[] so we can save the call to PetscSortIntWithCountArray() below 47290d88f7f4SJunchao Zhang perm[p] = tmp; 47300d88f7f4SJunchao Zhang break; 47310d88f7f4SJunchao Zhang } 47320d88f7f4SJunchao Zhang } 47330d88f7f4SJunchao Zhang } else { 4734651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4735651b1cf9SStefano Zampini hasdiag = (PetscBool)(hasdiag || (j[p] == row)); 4736651b1cf9SStefano 
Zampini minj = PetscMin(minj, j[p]); 4737651b1cf9SStefano Zampini } 47380d88f7f4SJunchao Zhang 4739651b1cf9SStefano Zampini if (hasdiag) { 4740651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4741651b1cf9SStefano Zampini if (j[p] == minj) j[p] = row; 4742651b1cf9SStefano Zampini else if (j[p] == row) j[p] = minj; 4743651b1cf9SStefano Zampini } 4744651b1cf9SStefano Zampini } 4745651b1cf9SStefano Zampini } 47460d88f7f4SJunchao Zhang } 47471c265611SJunchao Zhang // sort by columns in a row. perm[] indicates their original order 47480d88f7f4SJunchao Zhang if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4749651b1cf9SStefano Zampini 47500d88f7f4SJunchao Zhang if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q 47510d88f7f4SJunchao Zhang for (p = start; p < end; p++, q++) { 47520d88f7f4SJunchao Zhang Aj[q] = j[p]; 47530d88f7f4SJunchao Zhang jmap[q] = 1; 47540d88f7f4SJunchao Zhang } 47556497c311SBarry Smith PetscCall(PetscIntCast(end - start, Ai + row)); 47560d88f7f4SJunchao Zhang nnz += Ai[row]; // q is already advanced 47570d88f7f4SJunchao Zhang } else { 4758394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4759394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 4760651b1cf9SStefano Zampini jmap[q] = 1; /* Number of repeats of this nonzero entry */ 4761394ed5ebSJunchao Zhang Ai[row] = 1; 4762394ed5ebSJunchao Zhang nnz++; 4763394ed5ebSJunchao Zhang 4764394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4765394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4766394ed5ebSJunchao Zhang q++; 4767394ed5ebSJunchao Zhang jmap[q] = 1; 4768394ed5ebSJunchao Zhang Aj[q] = j[p]; 4769394ed5ebSJunchao Zhang Ai[row]++; 4770394ed5ebSJunchao Zhang nnz++; 4771394ed5ebSJunchao Zhang } else { 4772394ed5ebSJunchao Zhang jmap[q]++; 4773394ed5ebSJunchao Zhang } 4774394ed5ebSJunchao Zhang } 
4775394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4776394ed5ebSJunchao Zhang } 47770d88f7f4SJunchao Zhang } 47780d88f7f4SJunchao Zhang 4779394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4780394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 47810d88f7f4SJunchao Zhang jmap--; // Back to the beginning of jmap[] 4782394ed5ebSJunchao Zhang jmap[0] = 0; 4783394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 47840d88f7f4SJunchao Zhang 47859f0612e4SBarry Smith if (nnz < coo_n - nneg) { /* Reallocate with actual number of unique nonzeros */ 4786394ed5ebSJunchao Zhang PetscCount *jmap_new; 4787394ed5ebSJunchao Zhang PetscInt *Aj_new; 4788394ed5ebSJunchao Zhang 47899566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 47909566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 47919566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4792394ed5ebSJunchao Zhang jmap = jmap_new; 4793394ed5ebSJunchao Zhang 47949f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscInt), (void **)&Aj_new)); 47959566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 47969f0612e4SBarry Smith PetscCall(PetscShmgetDeallocateArray((void **)&Aj)); 4797394ed5ebSJunchao Zhang Aj = Aj_new; 4798394ed5ebSJunchao Zhang } 4799394ed5ebSJunchao Zhang 4800394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4801394ed5ebSJunchao Zhang PetscCount *perm_new; 4802cbc6b225SStefano Zampini 48039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 48049566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 48059566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4806394ed5ebSJunchao Zhang perm = perm_new; 4807394ed5ebSJunchao Zhang } 4808394ed5ebSJunchao Zhang 48099566063dSJacob 
Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 48109f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscScalar), (void **)&Aa)); 48119f0612e4SBarry Smith PetscCall(PetscArrayzero(Aa, nnz)); 48129566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4813394ed5ebSJunchao Zhang 4814394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 48152c4ab24aSJunchao Zhang 48162c4ab24aSJunchao Zhang // Put the COO struct in a container and then attach that to the matrix 48172c4ab24aSJunchao Zhang PetscCall(PetscMalloc1(1, &coo)); 48186497c311SBarry Smith PetscCall(PetscIntCast(nnz, &coo->nz)); 48192c4ab24aSJunchao Zhang coo->n = coo_n; 48202c4ab24aSJunchao Zhang coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again 48212c4ab24aSJunchao Zhang coo->jmap = jmap; // of length nnz+1 48222c4ab24aSJunchao Zhang coo->perm = perm; 482303e76207SPierre Jolivet PetscCall(PetscObjectContainerCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", coo, MatCOOStructDestroy_SeqAIJ)); 48243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4825394ed5ebSJunchao Zhang } 4826394ed5ebSJunchao Zhang 4827d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4828d71ae5a4SJacob Faibussowitsch { 4829394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4830394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 48312c4ab24aSJunchao Zhang PetscCount *perm, *jmap; 4832394ed5ebSJunchao Zhang PetscScalar *Aa; 48332c4ab24aSJunchao Zhang PetscContainer container; 48342c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 4835394ed5ebSJunchao Zhang 4836394ed5ebSJunchao Zhang PetscFunctionBegin; 48372c4ab24aSJunchao Zhang PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container)); 48382c4ab24aSJunchao Zhang 
PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix"); 48392c4ab24aSJunchao Zhang PetscCall(PetscContainerGetPointer(container, (void **)&coo)); 48402c4ab24aSJunchao Zhang perm = coo->perm; 48412c4ab24aSJunchao Zhang jmap = coo->jmap; 48429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4843394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4844b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4845b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4846b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4847394ed5ebSJunchao Zhang } 48489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 48493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4850394ed5ebSJunchao Zhang } 4851394ed5ebSJunchao Zhang 485234b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48535063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 485402fe1965SBarry Smith #endif 4855d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4856d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *); 4857d5e393b6SSuyash Tandon #endif 48583d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48595063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 48603d0639e7SStefano Zampini #endif 486102fe1965SBarry Smith 4862d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4863d71ae5a4SJacob Faibussowitsch { 4864273d9f13SBarry Smith Mat_SeqAIJ *b; 486538baddfdSBarry Smith PetscMPIInt size; 4866273d9f13SBarry Smith 4867273d9f13SBarry Smith PetscFunctionBegin; 48689566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 486908401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm 
must be of size 1"); 4870273d9f13SBarry Smith 48714dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 48722205254eSKarl Rupp 4873b0a32e0cSBarry Smith B->data = (void *)b; 4874aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 4875071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 48762205254eSKarl Rupp 4877f4259b30SLisandro Dalcin b->row = NULL; 4878f4259b30SLisandro Dalcin b->col = NULL; 4879f4259b30SLisandro Dalcin b->icol = NULL; 4880b810aeb4SBarry Smith b->reallocs = 0; 488136db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4882f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4883416022c9SBarry Smith b->nonew = 0; 4884f4259b30SLisandro Dalcin b->diag = NULL; 4885f4259b30SLisandro Dalcin b->solve_work = NULL; 4886f4259b30SLisandro Dalcin B->spptr = NULL; 4887f4259b30SLisandro Dalcin b->saved_values = NULL; 4888f4259b30SLisandro Dalcin b->idiag = NULL; 4889f4259b30SLisandro Dalcin b->mdiag = NULL; 4890f4259b30SLisandro Dalcin b->ssor_work = NULL; 489171f1c65dSBarry Smith b->omega = 1.0; 489271f1c65dSBarry Smith b->fshift = 0.0; 489371f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4894bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4895a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 489617ab2063SBarry Smith 48979566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4898d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 48999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 49009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4901b3866ffcSBarry Smith #endif 49029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 49039566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 49049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 49059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 49069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 49079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 49089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 49099779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 49109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4911191b95cbSRichard Tran Mills #endif 491234b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 49139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 49149566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49159566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 491602fe1965SBarry Smith #endif 4917d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4918d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 4919d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, 
"MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 4920d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ)); 4921d5e393b6SSuyash Tandon #endif 49223d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 49239566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 49243d0639e7SStefano Zampini #endif 49259566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4926af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 49279566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4928af8000cdSHong Zhang #endif 4929d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 49309566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4931d24d4204SJose E. 
Roman #endif 493263c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 49339566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 49349566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 493563c07aadSStefano Zampini #endif 49369566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 49379566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 49389566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 49399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 494014e4dea2SJose E. 
Roman PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ)); 49419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 49429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ)); 4943674b392bSAlexander PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetHash_C", MatResetHash_SeqAIJ)); 49449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 49459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 49469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 49479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 49489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 49499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 49509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 49519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 49529566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 49539566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 49549566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 49553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 495617ab2063SBarry Smith } 495717ab2063SBarry Smith 4958b24902e0SBarry Smith /* 49593893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4960b24902e0SBarry Smith */ 4961d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace) 4962d71ae5a4SJacob Faibussowitsch { 49632a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4964071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 496517ab2063SBarry Smith 49663a40ed3dSBarry Smith PetscFunctionBegin; 4967aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4968273d9f13SBarry Smith 4969d5f3da31SBarry Smith C->factortype = A->factortype; 4970f4259b30SLisandro Dalcin c->row = NULL; 4971f4259b30SLisandro Dalcin c->col = NULL; 4972f4259b30SLisandro Dalcin c->icol = NULL; 49736ad4291fSHong Zhang c->reallocs = 0; 4974bc43efbbSJunchao Zhang c->diagonaldense = a->diagonaldense; 497517ab2063SBarry Smith 497669272f91SPierre Jolivet C->assembled = A->assembled; 497717ab2063SBarry Smith 497869272f91SPierre Jolivet if (A->preallocated) { 49799566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 49809566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4981eec197d1SBarry Smith 498231fe6a7dSBarry Smith if (!A->hash_active) { 49839566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 49849566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 49859566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 49869566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, 
a->ilen, m * sizeof(PetscInt))); 498717ab2063SBarry Smith 498817ab2063SBarry Smith /* allocate the matrix space */ 4989f77e22a1SHong Zhang if (mallocmatspace) { 49909f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscScalar), (void **)&c->a)); 49919f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscInt), (void **)&c->j)); 49929f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(m + 1, sizeof(PetscInt), (void **)&c->i)); 49939566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 49949f0612e4SBarry Smith c->free_a = PETSC_TRUE; 49959f0612e4SBarry Smith c->free_ij = PETSC_TRUE; 499617ab2063SBarry Smith if (m > 0) { 49979566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4998be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 49992e5835c6SStefano Zampini const PetscScalar *aa; 50002e5835c6SStefano Zampini 50019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50029566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 50039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 5004be6bf707SBarry Smith } else { 50059566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 500617ab2063SBarry Smith } 500708480c60SBarry Smith } 5008f77e22a1SHong Zhang } 500931fe6a7dSBarry Smith C->preallocated = PETSC_TRUE; 501031fe6a7dSBarry Smith } else { 501131fe6a7dSBarry Smith PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix"); 501231fe6a7dSBarry Smith PetscCall(MatSetUp(C)); 501331fe6a7dSBarry Smith } 501417ab2063SBarry Smith 50156ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 5016416022c9SBarry Smith c->roworiented = a->roworiented; 5017416022c9SBarry Smith c->nonew = a->nonew; 5018416022c9SBarry Smith if (a->diag) { 50199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 
50209566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 5021071fcb05SBarry Smith } else c->diag = NULL; 50222205254eSKarl Rupp 5023f4259b30SLisandro Dalcin c->solve_work = NULL; 5024f4259b30SLisandro Dalcin c->saved_values = NULL; 5025f4259b30SLisandro Dalcin c->idiag = NULL; 5026f4259b30SLisandro Dalcin c->ssor_work = NULL; 5027a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 50286ad4291fSHong Zhang 5029893ad86cSHong Zhang c->rmax = a->rmax; 5030416022c9SBarry Smith c->nz = a->nz; 50318ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 5032754ec7b1SSatish Balay 50336ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 50346ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 5035cd6b891eSBarry Smith if (a->compressedrow.use) { 50366ad4291fSHong Zhang i = a->compressedrow.nrows; 50379566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 50389566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 50399566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 504027ea64f8SHong Zhang } else { 504127ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 50420298fd71SBarry Smith c->compressedrow.i = NULL; 50430298fd71SBarry Smith c->compressedrow.rindex = NULL; 50446ad4291fSHong Zhang } 5045ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 5046e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 50474846f1f5SKris Buschelman 50489566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 504969272f91SPierre Jolivet } 50509566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 50513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 505217ab2063SBarry Smith } 505317ab2063SBarry Smith 
5054d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 5055d71ae5a4SJacob Faibussowitsch { 5056b24902e0SBarry Smith PetscFunctionBegin; 50579566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 50589566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 505948a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 50609566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 50619566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 50623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5063b24902e0SBarry Smith } 5064b24902e0SBarry Smith 5065d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 5066d71ae5a4SJacob Faibussowitsch { 506752f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 506852f91c60SVaclav Hapla 506952f91c60SVaclav Hapla PetscFunctionBegin; 507052f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 507152f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 5072c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 50739566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 50749566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 50759566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 507652f91c60SVaclav Hapla if (isbinary) { 50779566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 507852f91c60SVaclav Hapla } else if (ishdf5) { 507952f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 50809566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 508152f91c60SVaclav 
Hapla #else 508252f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 508352f91c60SVaclav Hapla #endif 508452f91c60SVaclav Hapla } else { 508598921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 508652f91c60SVaclav Hapla } 50873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 508852f91c60SVaclav Hapla } 508952f91c60SVaclav Hapla 5090d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 5091d71ae5a4SJacob Faibussowitsch { 50923ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 50933ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 5094fbdbba38SShri Abhyankar 5095fbdbba38SShri Abhyankar PetscFunctionBegin; 50969566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5097bbead8a2SBarry Smith 50983ea6fe3dSLisandro Dalcin /* read in matrix header */ 50999566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 510008401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 51019371c9d4SSatish Balay M = header[1]; 51029371c9d4SSatish Balay N = header[2]; 51039371c9d4SSatish Balay nz = header[3]; 510408401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 510508401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 510608401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format 
on disk, cannot load as SeqAIJ"); 5107fbdbba38SShri Abhyankar 51083ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 51099566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 51103ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 51113ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 51123ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 51133ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 51143ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 51159566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 51169566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 51173ea6fe3dSLisandro Dalcin 51183ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 51199566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5120aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51213ea6fe3dSLisandro Dalcin 5122fbdbba38SShri Abhyankar /* read in row lengths */ 51239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 51249566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 51253ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 51269371c9d4SSatish Balay sum = 0; 51279371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 512808401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 51293ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 51309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 51319566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5132aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51333ea6fe3dSLisandro Dalcin /* store row lengths */ 51349566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 51359566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5136fbdbba38SShri Abhyankar 51373ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 51389371c9d4SSatish Balay a->i[0] = 0; 51399371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 51403ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 51419566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 51423ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 51439566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5144fbdbba38SShri Abhyankar 51459566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 51469566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 51473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5148fbdbba38SShri Abhyankar } 5149fbdbba38SShri Abhyankar 5150d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5151d71ae5a4SJacob Faibussowitsch { 51527264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5153fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5154eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5155eeffb40dSHong Zhang PetscInt k; 5156eeffb40dSHong Zhang #endif 51577264ac53SSatish Balay 51583a40ed3dSBarry Smith PetscFunctionBegin; 5159bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5160d0f46423SBarry Smith if ((A->rmap->n != 
B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5161ca44d042SBarry Smith *flg = PETSC_FALSE; 51623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5163bcd2baecSBarry Smith } 51647264ac53SSatish Balay 51657264ac53SSatish Balay /* if the a->i are the same */ 51669566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 51673ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 51687264ac53SSatish Balay 51697264ac53SSatish Balay /* if a->j are the same */ 51709566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 51713ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 5172bcd2baecSBarry Smith 51739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 51749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5175bcd2baecSBarry Smith /* if a->a are the same */ 5176eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5177eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5178fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5179eeffb40dSHong Zhang *flg = PETSC_FALSE; 51803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5181eeffb40dSHong Zhang } 5182eeffb40dSHong Zhang } 5183eeffb40dSHong Zhang #else 51849566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5185eeffb40dSHong Zhang #endif 51869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 51879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 51883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51897264ac53SSatish Balay } 519036db0b34SBarry Smith 519105869f15SSatish Balay /*@ 519211a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 519336db0b34SBarry Smith provided by the user. 

  Collective

  Input Parameters:
+ comm - must be an MPI communicator of size 1
. m    - number of rows
. n    - number of columns
. i    - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix
. j    - column indices
- a    - matrix values

  Output Parameter:
. mat - the matrix

  Level: intermediate

  Notes:
  The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays
  once the matrix is destroyed and not before

  You cannot set new nonzero locations into this matrix, that will generate an error.

  The `i` and `j` indices are 0 based

  The format which is used for the sparse matrix input, is equivalent to a
  row-major ordering,
i.e for the following matrix, the input data expected is 52208eef79e4SBarry Smith as shown 52212ef1f0ffSBarry Smith .vb 52222ef1f0ffSBarry Smith 1 0 0 52232ef1f0ffSBarry Smith 2 0 3 52242ef1f0ffSBarry Smith 4 5 6 5225a4552177SSatish Balay 52262ef1f0ffSBarry Smith i = {0,1,3,6} [size = nrow+1 = 3+1] 52272ef1f0ffSBarry Smith j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 52282ef1f0ffSBarry Smith v = {1,2,3,4,5,6} [size = 6] 52292ef1f0ffSBarry Smith .ve 5230a4552177SSatish Balay 52311cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 523236db0b34SBarry Smith @*/ 5233d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5234d71ae5a4SJacob Faibussowitsch { 5235cbcfb4deSHong Zhang PetscInt ii; 523636db0b34SBarry Smith Mat_SeqAIJ *aij; 5237cbcfb4deSHong Zhang PetscInt jj; 523836db0b34SBarry Smith 523936db0b34SBarry Smith PetscFunctionBegin; 5240aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 52419566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52429566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52439566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 52449566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5246ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 52479566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 52489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5249ab93d7beSBarry Smith 525036db0b34SBarry Smith aij->i = i; 525136db0b34SBarry Smith aij->j = j; 525236db0b34SBarry Smith aij->a = a; 
525336db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5254e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5255e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 525636db0b34SBarry Smith 5257cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 525836db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 525976bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5260aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 52619985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 526208401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 526308401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 52649985e31cSBarry Smith } 526536db0b34SBarry Smith } 526676bd3646SJed Brown } 526776bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 526836db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 526908401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5270da0802e2SStefano Zampini PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1); 527136db0b34SBarry Smith } 527276bd3646SJed Brown } 527336db0b34SBarry Smith 52749566063dSJacob 
Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52759566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 527736db0b34SBarry Smith } 5278cbc6b225SStefano Zampini 5279f62e3866SBarry Smith /*@ 528011a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 52818a0b0e6bSVictor Minden provided by the user. 52828a0b0e6bSVictor Minden 5283d083f849SBarry Smith Collective 52848a0b0e6bSVictor Minden 52858a0b0e6bSVictor Minden Input Parameters: 52868a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 52878a0b0e6bSVictor Minden . m - number of rows 52888a0b0e6bSVictor Minden . n - number of columns 52898a0b0e6bSVictor Minden . i - row indices 52908a0b0e6bSVictor Minden . j - column indices 52911230e6d1SVictor Minden . a - matrix values 52921230e6d1SVictor Minden . nz - number of nonzeros 52932ef1f0ffSBarry Smith - idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 52948a0b0e6bSVictor Minden 52958a0b0e6bSVictor Minden Output Parameter: 52968a0b0e6bSVictor Minden . 
mat - the matrix 52978a0b0e6bSVictor Minden 52988a0b0e6bSVictor Minden Level: intermediate 52998a0b0e6bSVictor Minden 5300f62e3866SBarry Smith Example: 5301f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 53029e99939fSJunchao Zhang .vb 53038a0b0e6bSVictor Minden 1 0 0 53048a0b0e6bSVictor Minden 2 0 3 53058a0b0e6bSVictor Minden 4 5 6 53068a0b0e6bSVictor Minden 53078a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 53088a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 53098a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 53109e99939fSJunchao Zhang .ve 5311fe59aa6dSJacob Faibussowitsch 53122ef1f0ffSBarry Smith Note: 5313d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5314d7547e51SJunchao Zhang and are particularly useful in iterative applications. 53158a0b0e6bSVictor Minden 53161cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 53178a0b0e6bSVictor Minden @*/ 5318d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5319d71ae5a4SJacob Faibussowitsch { 5320d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 53218a0b0e6bSVictor Minden 53228a0b0e6bSVictor Minden PetscFunctionBegin; 53239566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5324ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 53259566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 53269566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 53279566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 53289566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 53291230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 53301230e6d1SVictor Minden if (idx) { 53311230e6d1SVictor Minden row = i[ii] - 1; 53321230e6d1SVictor Minden col = j[ii] - 1; 53331230e6d1SVictor Minden } else { 53341230e6d1SVictor Minden row = i[ii]; 53351230e6d1SVictor Minden col = j[ii]; 53368a0b0e6bSVictor Minden } 53379566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 53388a0b0e6bSVictor Minden } 53399566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 53409566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 53419566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 53423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53438a0b0e6bSVictor Minden } 534436db0b34SBarry Smith 5345d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5346d71ae5a4SJacob Faibussowitsch { 5347acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5348acf2f550SJed Brown 5349acf2f550SJed Brown PetscFunctionBegin; 5350acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5351acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 53522205254eSKarl Rupp 53539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 53543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5355acf2f550SJed Brown } 5356acf2f550SJed Brown 5357d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5358d71ae5a4SJacob Faibussowitsch { 53599c8f2541SHong Zhang PetscFunctionBegin; 53609566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 53613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53629c8f2541SHong Zhang } 53639c8f2541SHong Zhang 536481824310SBarry Smith /* 536553dd7562SDmitry Karpeev Permute A 
into C's *local* index space using rowemb,colemb. 536653dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 536753dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 536853dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 536953dd7562SDmitry Karpeev */ 5370d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5371d71ae5a4SJacob Faibussowitsch { 537253dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 537353dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 537453dd7562SDmitry Karpeev PetscBool seqaij; 537553dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 537653dd7562SDmitry Karpeev PetscScalar v; 537753dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 537853dd7562SDmitry Karpeev 537953dd7562SDmitry Karpeev PetscFunctionBegin; 53803ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 538153dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 53829566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 538328b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 538453dd7562SDmitry Karpeev if (rowemb) { 53859566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 538608401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 538753dd7562SDmitry Karpeev } else { 538808401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 538953dd7562SDmitry Karpeev } 539053dd7562SDmitry Karpeev if (colemb) { 53919566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 539208401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 539353dd7562SDmitry Karpeev } else { 539408401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 539553dd7562SDmitry Karpeev } 539653dd7562SDmitry Karpeev 5397f4f49eeaSPierre Jolivet Baij = (Mat_SeqAIJ *)B->data; 539853dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 53999566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5400ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 54019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 54029566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 540353dd7562SDmitry Karpeev } 540448a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 540553dd7562SDmitry Karpeev count = 0; 540653dd7562SDmitry Karpeev rowindices = NULL; 
540753dd7562SDmitry Karpeev colindices = NULL; 540848a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 540948a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 541053dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 541153dd7562SDmitry Karpeev PetscInt row; 541253dd7562SDmitry Karpeev row = i; 541353dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 541453dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 541553dd7562SDmitry Karpeev PetscInt col; 541653dd7562SDmitry Karpeev col = Baij->j[count]; 541753dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 541853dd7562SDmitry Karpeev v = Baij->a[count]; 54199566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 542053dd7562SDmitry Karpeev ++count; 542153dd7562SDmitry Karpeev } 542253dd7562SDmitry Karpeev } 542353dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 542453dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 542553dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 542653dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 542753dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 54283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 542953dd7562SDmitry Karpeev } 543053dd7562SDmitry Karpeev 543158c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep) 5432dec0b466SHong Zhang { 5433dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5434dec0b466SHong Zhang MatScalar *aa = a->a; 5435dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5436dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5437dec0b466SHong Zhang 5438dec0b466SHong Zhang PetscFunctionBegin; 5439dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5440dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5441dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5442dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5443dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 544458c11ad4SPierre Jolivet if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++; 5445dec0b466SHong Zhang else { 5446dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5447dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5448dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5449dec0b466SHong Zhang } 5450dec0b466SHong Zhang } 5451dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5452dec0b466SHong Zhang fshift_prev = fshift; 5453dec0b466SHong Zhang /* reset ilen and imax for each row */ 5454dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5455dec0b466SHong Zhang a->nonzerorowcnt += 
((ai[i] - fshift - ai[i - 1]) > 0); 5456dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5457dec0b466SHong Zhang } 5458312eded4SPierre Jolivet if (fshift) { 5459dec0b466SHong Zhang if (m) { 5460dec0b466SHong Zhang ai[m] -= fshift; 5461dec0b466SHong Zhang a->nz = ai[m]; 5462dec0b466SHong Zhang } 5463dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5464312eded4SPierre Jolivet A->nonzerostate++; 5465dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5466dec0b466SHong Zhang a->rmax = rmax; 5467dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5468dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5469dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5470312eded4SPierre Jolivet } 54713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5472dec0b466SHong Zhang } 5473dec0b466SHong Zhang 54744099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 54754099cc6bSBarry Smith 5476cc4c1da9SBarry Smith /*@ 547711a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 54784099cc6bSBarry Smith 5479c3339decSBarry Smith Collective 54804099cc6bSBarry Smith 54814099cc6bSBarry Smith Input Parameters: 54824099cc6bSBarry Smith + mat - the matrix object 54834099cc6bSBarry Smith - matype - matrix type 54844099cc6bSBarry Smith 54854099cc6bSBarry Smith Options Database Key: 54864e187271SRichard Tran Mills . 
-mat_seqaij_type <method> - for example seqaijcrl 54874099cc6bSBarry Smith 54884099cc6bSBarry Smith Level: intermediate 54894099cc6bSBarry Smith 5490fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType` 54914099cc6bSBarry Smith @*/ 5492d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5493d71ae5a4SJacob Faibussowitsch { 54944099cc6bSBarry Smith PetscBool sametype; 54955f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 54964099cc6bSBarry Smith 54974099cc6bSBarry Smith PetscFunctionBegin; 54984099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 54999566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 55003ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 55014099cc6bSBarry Smith 55029566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 55036adde796SStefano Zampini PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 55049566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 55053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55064099cc6bSBarry Smith } 55074099cc6bSBarry Smith 55084099cc6bSBarry Smith /*@C 550911a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 55104099cc6bSBarry Smith 5511cc4c1da9SBarry Smith Not Collective, No Fortran Support 55124099cc6bSBarry Smith 55134099cc6bSBarry Smith Input Parameters: 5514fe59aa6dSJacob Faibussowitsch + sname - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 55154099cc6bSBarry Smith - function - routine to convert to subtype 55164099cc6bSBarry Smith 55172ef1f0ffSBarry Smith Level: advanced 55182ef1f0ffSBarry Smith 55194099cc6bSBarry Smith Notes: 552011a5261eSBarry Smith 
`MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 55214099cc6bSBarry Smith 55224099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 55234099cc6bSBarry Smith $ -mat_seqaij_type my_mat 55244099cc6bSBarry Smith 55251cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()` 55264099cc6bSBarry Smith @*/ 5527d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5528d71ae5a4SJacob Faibussowitsch { 55294099cc6bSBarry Smith PetscFunctionBegin; 55309566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 55319566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 55323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55334099cc6bSBarry Smith } 55344099cc6bSBarry Smith 55354099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 55364099cc6bSBarry Smith 55374099cc6bSBarry Smith /*@C 553811a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 55394099cc6bSBarry Smith 55404099cc6bSBarry Smith Not Collective 55414099cc6bSBarry Smith 55424099cc6bSBarry Smith Level: advanced 55434099cc6bSBarry Smith 55442ef1f0ffSBarry Smith Note: 55452ef1f0ffSBarry Smith This registers the versions of `MATSEQAIJ` for GPUs 55462ef1f0ffSBarry Smith 55471cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()` 55484099cc6bSBarry Smith @*/ 5549d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5550d71ae5a4SJacob Faibussowitsch { 55514099cc6bSBarry Smith PetscFunctionBegin; 55523ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 55534099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 55544099cc6bSBarry Smith 55559566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 55569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 55579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 55589779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 55599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5560485f9817SRichard Tran Mills #endif 55615063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 55629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 55635063d097SStefano Zampini #endif 5564d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5565d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5566d5e393b6SSuyash Tandon #endif 55675063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 55689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 55695063d097SStefano Zampini #endif 55704099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 55719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 55724099cc6bSBarry Smith #endif 55733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55744099cc6bSBarry Smith } 557553dd7562SDmitry Karpeev 557653dd7562SDmitry Karpeev /* 557781824310SBarry Smith Special version for direct calls from Fortran 557881824310SBarry Smith */ 557981824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 558081824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 558181824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 558281824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 558381824310SBarry Smith #endif 558481824310SBarry Smith 558581824310SBarry Smith /* Change 
these macros so can be used in void function */

/* Change these macros so can be used in void function */
/* Identical to PetscCallVoid, except it assigns to *_ierr */
/* On a nonzero error code the redefined PetscCall() stores the result of PetscError() in *_ierr and
   returns from the enclosing void function; it therefore requires a variable named _ierr in scope */
#undef PetscCall
#define PetscCall(...) \
  do { \
    PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \
    if (PetscUnlikely(ierr_msv_mpiaij)) { \
      *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \
      return; \
    } \
  } while (0)

/* The redefined SETERRQ() likewise stores the error in *_ierr and returns without a value */
#undef SETERRQ
#define SETERRQ(comm, ierr, ...) \
  do { \
    *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \
    return; \
  } while (0)

/*
  matsetvaluesseqaij_ - inserts or adds an m-by-n block of values into a SeqAIJ matrix; every argument is
  passed by pointer and the error code is returned through _ierr

  Input Parameters:
+ AA   - pointer to the matrix
. mm   - pointer to the number of rows in the block
. im   - row indices; negative entries are skipped
. nn   - pointer to the number of columns in the block
. in   - column indices; negative entries are skipped
. v    - the values, read as v[l + k * n] when a->roworiented is set and as v[k + l * m] otherwise
- isis - pointer to the insert mode; ADD_VALUES adds to an existing entry, any other mode overwrites it

  Output Parameter:
. _ierr - set by the redefined PetscCall()/SETERRQ() when an error is raised
          NOTE(review): no explicit assignment to *_ierr on the success path is visible in this function -
          confirm what callers expect

  Notes:
  A row index >= A->rmap->n or a column index >= A->cmap->n raises PETSC_ERR_ARG_OUTOFRANGE.
*/
PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr)
{
  Mat         A  = *AA;
  PetscInt    m  = *mm, n = *nn;
  InsertMode  is = *isis;
  Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
  PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
  PetscInt   *imax, *ai, *ailen;
  PetscInt   *aj, nonew = a->nonew, lastcol = -1;
  MatScalar  *ap, value, *aa;
  PetscBool   ignorezeroentries = a->ignorezeroentries;
  PetscBool   roworiented       = a->roworiented;

  PetscFunctionBegin;
  MatCheckPreallocated(A, 1);
  imax  = a->imax;
  ai    = a->i;
  ailen = a->ilen;
  aj    = a->j;
  aa    = a->a;

  for (k = 0; k < m; k++) { /* loop over added rows */
    row = im[k];
    if (row < 0) continue;
    PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large");
    /* rp/ap point at the column indices/values of this row; nrow entries are in use */
    rp   = aj + ai[row];
    ap   = aa + ai[row];
    rmax = imax[row];
    nrow = ailen[row];
    low  = 0;
    high = nrow;
    for (l = 0; l < n; l++) { /* loop over added columns */
      if (in[l] < 0) continue;
      PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large");
      col = in[l];
      if (roworiented) value = v[l + k * n];
      else value = v[k + l * m];

      if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;

      /* reuse the previous search window when columns arrive in increasing order, otherwise restart from the row start */
      if (col <= lastcol) low = 0;
      else high = nrow;
      lastcol = col;
      /* bisect until the window holds at most 5 entries, then scan it linearly */
      while (high - low > 5) {
        t = (low + high) / 2;
        if (rp[t] > col) high = t;
        else low = t;
      }
      for (i = low; i < high; i++) {
        if (rp[i] > col) break;
        if (rp[i] == col) {
          /* the entry already exists: update it in place */
          if (is == ADD_VALUES) ap[i] += value;
          else ap[i] = value;
          goto noinsert;
        }
      }
      /* column not present in this row; i is the position where it would be inserted */
      if (value == 0.0 && ignorezeroentries) goto noinsert;
      /* nonew == 1 silently drops a new nonzero location, nonew == -1 turns it into an error */
      if (nonew == 1) goto noinsert;
      PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix");
      /* NOTE(review): macro defined elsewhere; presumably enlarges the storage when the row is full and
         updates the local pointers passed to it - confirm against its definition */
      MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
      /* N is the index of the last entry in use before the row length is incremented */
      N = nrow++ - 1;
      a->nz++;
      high++;
      /* shift up all the later entries in this row */
      for (ii = N; ii >= i; ii--) {
        rp[ii + 1] = rp[ii];
        ap[ii + 1] = ap[ii];
      }
      rp[i] = col;
      ap[i] = value;
    noinsert:;
      /* the next search in this row starts just after the position handled here */
      low = i + 1;
    }
    ailen[row] = nrow;
  }
  PetscFunctionReturnVoid();
}
/* Undefining these here since they were redefined from their original definition above! No
 * other PETSc functions should be defined past this point, as it is impossible to recover the
 * original definitions */
#undef PetscCall
#undef SETERRQ