1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 20d71ae5a4SJacob Faibussowitsch { 214099cc6bSBarry Smith PetscBool flg; 224099cc6bSBarry Smith char type[256]; 234099cc6bSBarry Smith 244099cc6bSBarry Smith PetscFunctionBegin; 25d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 279566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 28d0609cedSBarry Smith PetscOptionsEnd(); 293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 304099cc6bSBarry Smith } 314099cc6bSBarry Smith 32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 33d71ae5a4SJacob Faibussowitsch { 340716a85fSBarry Smith PetscInt i, m, n; 350716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 360716a85fSBarry Smith 370716a85fSBarry Smith PetscFunctionBegin; 389566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 400716a85fSBarry Smith if (type == NORM_2) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 420716a85fSBarry Smith } else if (type == NORM_1) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_INFINITY) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 506adde796SStefano Zampini } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 53a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 54857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 560716a85fSBarry Smith } 573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 580716a85fSBarry Smith } 590716a85fSBarry Smith 60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 61d71ae5a4SJacob Faibussowitsch { 623a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 633a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 
643a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 653a062f41SBarry Smith PetscInt *rows; 663a062f41SBarry Smith 673a062f41SBarry Smith PetscFunctionBegin; 683a062f41SBarry Smith for (i = 0; i < m; i++) { 69ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i = 0; i < m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 799566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 84d71ae5a4SJacob Faibussowitsch { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 86fff043a9SJunchao Zhang const MatScalar *aa; 876ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith 916ce1633cSBarry Smith PetscFunctionBegin; 929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 939566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i = 0; i < m; i++) { 96ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 976ce1633cSBarry Smith } 989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 996ce1633cSBarry Smith cnt = 0; 1006ce1633cSBarry 
Smith for (i = 0; i < m; i++) { 101ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1026ce1633cSBarry Smith } 103f1f41ecbSJed Brown *nrows = cnt; 104f1f41ecbSJed Brown *zrows = rows; 1059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107f1f41ecbSJed Brown } 108f1f41ecbSJed Brown 109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 110d71ae5a4SJacob Faibussowitsch { 111f1f41ecbSJed Brown PetscInt nrows, *rows; 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscFunctionBegin; 1140298fd71SBarry Smith *zrows = NULL; 1159566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1169566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1186ce1633cSBarry Smith } 1196ce1633cSBarry Smith 120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 121d71ae5a4SJacob Faibussowitsch { 122b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 123b3a44c85SBarry Smith const MatScalar *aa; 124b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 125b3a44c85SBarry Smith const PetscInt *ii; 126b3a44c85SBarry Smith PetscInt n, i, j, *rows; 127b3a44c85SBarry Smith 128b3a44c85SBarry Smith PetscFunctionBegin; 1299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 130f4259b30SLisandro Dalcin *keptrows = NULL; 131b3a44c85SBarry Smith ii = a->i; 132b3a44c85SBarry Smith for (i = 0; i < m; i++) { 133b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 134b3a44c85SBarry Smith if (!n) { 135b3a44c85SBarry Smith cnt++; 136b3a44c85SBarry Smith goto ok1; 137b3a44c85SBarry Smith } 1382e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 
139b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 140b3a44c85SBarry Smith } 141b3a44c85SBarry Smith cnt++; 142b3a44c85SBarry Smith ok1:; 143b3a44c85SBarry Smith } 1442e5835c6SStefano Zampini if (!cnt) { 1459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1472e5835c6SStefano Zampini } 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 149b3a44c85SBarry Smith cnt = 0; 150b3a44c85SBarry Smith for (i = 0; i < m; i++) { 151b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 152b3a44c85SBarry Smith if (!n) continue; 1532e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 154b3a44c85SBarry Smith if (aa[j] != 0.0) { 155b3a44c85SBarry Smith rows[cnt++] = i; 156b3a44c85SBarry Smith break; 157b3a44c85SBarry Smith } 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 1609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1619566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith 165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 166d71ae5a4SJacob Faibussowitsch { 16779299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172ace3abfcSBarry Smith PetscBool missing; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 1769566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 17709f38230SBarry Smith if (!missing) { 17879299369SBarry Smith diag = aij->diag; 1799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 
1809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 18179299369SBarry Smith if (is == INSERT_VALUES) { 182ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18379299369SBarry Smith } else { 184ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18579299369SBarry Smith } 1869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18979299369SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 19109f38230SBarry Smith } 1929566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19409f38230SBarry Smith } 19579299369SBarry Smith 196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 197d71ae5a4SJacob Faibussowitsch { 198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19997f1f81fSBarry Smith PetscInt i, ishift; 20017ab2063SBarry Smith 2013a40ed3dSBarry Smith PetscFunctionBegin; 202f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2033ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 204bfeeae90SHong Zhang ishift = 0; 205b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2069566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 207bfeeae90SHong Zhang } else if (oshift == 1) { 2081a83f524SJed Brown PetscInt *tia; 209d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2103b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 
2121a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2131a83f524SJed Brown *ia = tia; 214ecc77c7aSBarry Smith if (ja) { 2151a83f524SJed Brown PetscInt *tja; 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob 
Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch 
PetscCall(PetscFree(*ja)); 2813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; 
row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 
379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, 
PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 4188e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 4198e3a54c0SPierre Jolivet if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]); 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != 
col) goto noinsert; 453c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e44c0bd4SBarry Smith noinsert:; 47217ab2063SBarry Smith } 47317ab2063SBarry Smith ailen[row] = nrow; 47417ab2063SBarry Smith } 4759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47717ab2063SBarry Smith } 47817ab2063SBarry Smith 479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 480d71ae5a4SJacob Faibussowitsch { 48119b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48219b08ed1SBarry Smith PetscInt *rp, k, row; 48319b08ed1SBarry Smith PetscInt *ai = a->i; 48419b08ed1SBarry Smith PetscInt *aj = a->j; 485fff043a9SJunchao Zhang 
MatScalar *aa, *ap; 48619b08ed1SBarry Smith 48719b08ed1SBarry Smith PetscFunctionBegin; 48828b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 48908401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 490fff043a9SJunchao Zhang 4919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49219b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49319b08ed1SBarry Smith row = im[k]; 49419b08ed1SBarry Smith rp = aj + ai[row]; 4958e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 49619b08ed1SBarry Smith 4979566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49819b08ed1SBarry Smith if (!A->structure_only) { 49919b08ed1SBarry Smith if (v) { 5009566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 50119b08ed1SBarry Smith v += n; 50219b08ed1SBarry Smith } else { 5039566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50419b08ed1SBarry Smith } 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith a->ilen[row] = n; 50719b08ed1SBarry Smith a->imax[row] = n; 50819b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 50919b08ed1SBarry Smith a->nz += n; 51019b08ed1SBarry Smith } 5119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51319b08ed1SBarry Smith } 51419b08ed1SBarry Smith 51519b08ed1SBarry Smith /*@ 51619b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 
51719b08ed1SBarry Smith 51819b08ed1SBarry Smith Input Parameters: 51911a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52119b08ed1SBarry Smith 52219b08ed1SBarry Smith Level: advanced 52319b08ed1SBarry Smith 52419b08ed1SBarry Smith Notes: 52519b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52611a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52719b08ed1SBarry Smith as always with multiple matrix assemblies. 52819b08ed1SBarry Smith 5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53019b08ed1SBarry Smith @*/ 531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 532d71ae5a4SJacob Faibussowitsch { 53319b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53419b08ed1SBarry Smith 53519b08ed1SBarry Smith PetscFunctionBegin; 5369566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53819b08ed1SBarry Smith a->maxnz = nztotal; 5394dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 54019b08ed1SBarry Smith if (!a->ilen) { 5419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54219b08ed1SBarry Smith } else { 5439566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54419b08ed1SBarry Smith } 54519b08ed1SBarry Smith 54619b08ed1SBarry Smith /* allocate the matrix space */ 5479f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(A->rmap->n + 1, sizeof(PetscInt), (void **)&a->i)); 5489f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscInt), (void **)&a->j)); 
5499f0612e4SBarry Smith a->free_ij = PETSC_TRUE; 55019b08ed1SBarry Smith if (A->structure_only) { 55119b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55219b08ed1SBarry Smith } else { 5539f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscScalar), (void **)&a->a)); 55419b08ed1SBarry Smith a->free_a = PETSC_TRUE; 55519b08ed1SBarry Smith } 5569f0612e4SBarry Smith a->i[0] = 0; 55719b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 55819b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56019b08ed1SBarry Smith } 56119b08ed1SBarry Smith 562ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 563d71ae5a4SJacob Faibussowitsch { 564071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 565071fcb05SBarry Smith PetscInt *rp, k, row; 566071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 567071fcb05SBarry Smith PetscInt *aj = a->j; 568fff043a9SJunchao Zhang MatScalar *aa, *ap; 569071fcb05SBarry Smith 570071fcb05SBarry Smith PetscFunctionBegin; 5719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 572071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 573071fcb05SBarry Smith row = im[k]; 5746bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 575071fcb05SBarry Smith rp = aj + ai[row]; 576071fcb05SBarry Smith ap = aa + ai[row]; 57748a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 578071fcb05SBarry Smith if (!A->structure_only) { 579071fcb05SBarry Smith if (v) { 5809566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 581071fcb05SBarry Smith v += n; 
582071fcb05SBarry Smith } else { 5839566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 584071fcb05SBarry Smith } 585071fcb05SBarry Smith } 586071fcb05SBarry Smith ailen[row] = n; 587071fcb05SBarry Smith a->nz += n; 588071fcb05SBarry Smith } 5899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 591071fcb05SBarry Smith } 592071fcb05SBarry Smith 593ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 594d71ae5a4SJacob Faibussowitsch { 5957eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 59697f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59797f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 5984e208921SJed Brown const MatScalar *ap, *aa; 5997eb43aa7SLois Curfman McInnes 6003a40ed3dSBarry Smith PetscFunctionBegin; 6014e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6027eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6037eb43aa7SLois Curfman McInnes row = im[k]; 6049371c9d4SSatish Balay if (row < 0) { 6059371c9d4SSatish Balay v += n; 6069371c9d4SSatish Balay continue; 6079371c9d4SSatish Balay } /* negative row */ 60854c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 6098e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 6108e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 6117eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6127eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6139371c9d4SSatish Balay if (in[l] < 0) { 6149371c9d4SSatish Balay v++; 6159371c9d4SSatish Balay continue; 6169371c9d4SSatish Balay } /* negative column */ 
61754c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 618bfeeae90SHong Zhang col = in[l]; 6199371c9d4SSatish Balay high = nrow; 6209371c9d4SSatish Balay low = 0; /* assume unsorted */ 6217eb43aa7SLois Curfman McInnes while (high - low > 5) { 6227eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6237eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6247eb43aa7SLois Curfman McInnes else low = t; 6257eb43aa7SLois Curfman McInnes } 6267eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6277eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6287eb43aa7SLois Curfman McInnes if (rp[i] == col) { 629b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6307eb43aa7SLois Curfman McInnes goto finished; 6317eb43aa7SLois Curfman McInnes } 6327eb43aa7SLois Curfman McInnes } 63397e567efSBarry Smith *v++ = 0.0; 6347eb43aa7SLois Curfman McInnes finished:; 6357eb43aa7SLois Curfman McInnes } 6367eb43aa7SLois Curfman McInnes } 6374e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6397eb43aa7SLois Curfman McInnes } 6407eb43aa7SLois Curfman McInnes 641ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 642d71ae5a4SJacob Faibussowitsch { 6433ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 644c898d852SStefano Zampini const PetscScalar *av; 6453ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6463ea6fe3dSLisandro Dalcin PetscInt *rowlens; 64717ab2063SBarry Smith 6483a40ed3dSBarry Smith PetscFunctionBegin; 6499566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6502205254eSKarl Rupp 6513ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6523ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6533ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6543ea6fe3dSLisandro Dalcin nz = A->nz; 655416022c9SBarry 
Smith 6563ea6fe3dSLisandro Dalcin /* write matrix header */ 6573ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6589371c9d4SSatish Balay header[1] = M; 6599371c9d4SSatish Balay header[2] = N; 6609371c9d4SSatish Balay header[3] = nz; 6619566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 662416022c9SBarry Smith 6633ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6653ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 666e457bb90SBarry Smith if (PetscDefined(USE_DEBUG)) { 667e457bb90SBarry Smith PetscInt mnz = 0; 668e457bb90SBarry Smith 669e457bb90SBarry Smith for (i = 0; i < m; i++) mnz += rowlens[i]; 670e457bb90SBarry Smith PetscCheck(nz == mnz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row lens %" PetscInt_FMT " do not sum to nz %" PetscInt_FMT, mnz, nz); 671e457bb90SBarry Smith } 6729566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6739566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6743ea6fe3dSLisandro Dalcin /* store column indices */ 6759566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 676416022c9SBarry Smith /* store nonzero values */ 6779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6789566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 680b37d52dbSMark F. 
Adams 6813ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6829566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 68417ab2063SBarry Smith } 685416022c9SBarry Smith 686d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 687d71ae5a4SJacob Faibussowitsch { 6887dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6897dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6907dc0baabSHong Zhang 6917dc0baabSHong Zhang PetscFunctionBegin; 6929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6937dc0baabSHong Zhang for (i = 0; i < m; i++) { 6949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 69548a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6977dc0baabSHong Zhang } 6989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7007dc0baabSHong Zhang } 7017dc0baabSHong Zhang 70209573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 703cd155464SBarry Smith 704ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 705d71ae5a4SJacob Faibussowitsch { 706416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 707c898d852SStefano Zampini const PetscScalar *av; 70860e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 709e060cb09SBarry Smith const char *name; 710f3ef73ceSBarry Smith PetscViewerFormat format; 71117ab2063SBarry Smith 7123a40ed3dSBarry Smith PetscFunctionBegin; 7137dc0baabSHong Zhang if (A->structure_only) { 7149566063dSJacob Faibussowitsch 
PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7167dc0baabSHong Zhang } 71743e49210SHong Zhang 7189566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 719bd6a2ce3SJunchao Zhang // By petsc's rule, even PETSC_VIEWER_ASCII_INFO_DETAIL doesn't print matrix entries 7203ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 7212e5835c6SStefano Zampini 722c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 72571c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 72697f1f81fSBarry Smith PetscInt nofinalvalue = 0; 72760e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 728c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 729d00d2cf4SBarry Smith nofinalvalue = 1; 730d00d2cf4SBarry Smith } 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 734fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 736fbfe6fa7SJed Brown #else 7379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 738fbfe6fa7SJed Brown #endif 7399566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 74017ab2063SBarry Smith 74117ab2063SBarry Smith for (i = 0; i < m; i++) { 74260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 743aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 74517ab2063SBarry Smith #else 7469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 74717ab2063SBarry Smith #endif 74817ab2063SBarry Smith } 74917ab2063SBarry Smith } 750d00d2cf4SBarry Smith if (nofinalvalue) { 751c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 753c337ccceSJed Brown #else 7549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 755c337ccceSJed Brown #endif 756d00d2cf4SBarry Smith } 7579566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 760fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 76244cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 76460e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 765aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76636db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76836db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 77036db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7726831982aSBarry Smith } 77344cd7ae7SLois Curfman McInnes #else 7749566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 77544cd7ae7SLois Curfman McInnes #endif 77644cd7ae7SLois Curfman McInnes } 7779566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77844cd7ae7SLois 
Curfman McInnes } 7799566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 780fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 78197f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7839566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 784496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 785496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 78660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 787496be53dSLois Curfman McInnes if (a->j[j] >= i) { 788aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78936db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 790496be53dSLois Curfman McInnes #else 791496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 792496be53dSLois Curfman McInnes #endif 793496be53dSLois Curfman McInnes } 794496be53dSLois Curfman McInnes } 795496be53dSLois Curfman McInnes } 7962e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7982e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7992205254eSKarl Rupp if (i + 4 < m) { 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 8012205254eSKarl Rupp } else if (i + 3 < m) { 8029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 8032205254eSKarl Rupp } else if (i + 2 < m) { 8049566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 8052205254eSKarl Rupp } else if (i + 1 < m) { 8069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 8072205254eSKarl Rupp } else if (i < m) { 8089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8092205254eSKarl Rupp } else { 8109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8112205254eSKarl Rupp } 812496be53dSLois Curfman McInnes } 8139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8149566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 815496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8179566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 818496be53dSLois Curfman McInnes } 8199566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 820496be53dSLois Curfman McInnes } 8219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 822496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 82360e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 824496be53dSLois Curfman McInnes if (a->j[j] >= i) { 825aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 82648a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 827496be53dSLois Curfman McInnes #else 8289566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
829496be53dSLois Curfman McInnes #endif 830496be53dSLois Curfman McInnes } 831496be53dSLois Curfman McInnes } 8329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 833496be53dSLois Curfman McInnes } 8349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 835fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 83697f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 83787828ca2SBarry Smith PetscScalar value; 83868f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83968f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 84068f1ed48SBarry Smith 84168f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 84268f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 84368f1ed48SBarry Smith realonly = PETSC_FALSE; 84468f1ed48SBarry Smith break; 84568f1ed48SBarry Smith } 84668f1ed48SBarry Smith } 84768f1ed48SBarry Smith #endif 84802594712SBarry Smith 8499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 85002594712SBarry Smith for (i = 0; i < m; i++) { 85102594712SBarry Smith jcnt = 0; 852d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 853e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 85402594712SBarry Smith value = a->a[cnt++]; 855e24b481bSBarry Smith jcnt++; 85602594712SBarry Smith } else { 85702594712SBarry Smith value = 0.0; 85802594712SBarry Smith } 859aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 86068f1ed48SBarry Smith if (realonly) { 8619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 86268f1ed48SBarry Smith } else { 8639566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 86468f1ed48SBarry Smith } 86502594712SBarry Smith #else 8669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 86702594712SBarry Smith 
#endif 86802594712SBarry Smith } 8699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 87002594712SBarry Smith } 8719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8723c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 873150b93efSMatthew G. Knepley PetscInt fshift = 1; 8749566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8773c215bfdSMatthew Knepley #else 8789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8793c215bfdSMatthew Knepley #endif 8809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8813c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 88260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8833c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8853c215bfdSMatthew Knepley #else 8869566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8873c215bfdSMatthew Knepley #endif 8883c215bfdSMatthew Knepley } 8893c215bfdSMatthew Knepley } 8909566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8913a40ed3dSBarry Smith } else { 8929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 893d5f3da31SBarry Smith if (A->factortype) { 89416cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 89616cd7e1dSShri Abhyankar /* L part */ 89760e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 90116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 90316cd7e1dSShri Abhyankar } else { 9049566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 90516cd7e1dSShri Abhyankar } 90616cd7e1dSShri Abhyankar #else 9079566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90816cd7e1dSShri Abhyankar #endif 90916cd7e1dSShri Abhyankar } 91016cd7e1dSShri Abhyankar /* diagonal */ 91116cd7e1dSShri Abhyankar j = a->diag[i]; 91216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91316cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 91516cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9169566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 91716cd7e1dSShri Abhyankar } else { 9189566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91916cd7e1dSShri Abhyankar } 92016cd7e1dSShri Abhyankar #else 9219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 92216cd7e1dSShri Abhyankar #endif 92316cd7e1dSShri Abhyankar 92416cd7e1dSShri Abhyankar /* U part */ 92560e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 92616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 92716cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9289566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92916cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 93116cd7e1dSShri Abhyankar } else { 9329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 93316cd7e1dSShri Abhyankar } 93416cd7e1dSShri Abhyankar #else 9359566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 93616cd7e1dSShri Abhyankar #endif 93716cd7e1dSShri Abhyankar } 9389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93916cd7e1dSShri Abhyankar } 94016cd7e1dSShri Abhyankar } else { 94117ab2063SBarry Smith for (i = 0; i < m; i++) { 9429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 94360e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 944aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 94536db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94736db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9493a40ed3dSBarry Smith } else { 9509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 95117ab2063SBarry Smith } 95217ab2063SBarry Smith #else 9539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 95417ab2063SBarry Smith #endif 95517ab2063SBarry Smith } 9569566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95717ab2063SBarry Smith } 95816cd7e1dSShri Abhyankar } 9599566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 96017ab2063SBarry Smith } 9619566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 963416022c9SBarry Smith } 964416022c9SBarry Smith 9659804daf3SBarry Smith #include <petscdraw.h> 966ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 967d71ae5a4SJacob Faibussowitsch { 968480ef9eaSBarry Smith Mat A = (Mat)Aa; 969416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 970383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 971383922c3SLisandro Dalcin int color; 972b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 973b0a32e0cSBarry Smith PetscViewer viewer; 974f3ef73ceSBarry Smith PetscViewerFormat format; 975fff043a9SJunchao Zhang const PetscScalar *aa; 976cddf8d76SBarry Smith 
9773a40ed3dSBarry Smith PetscFunctionBegin; 9789566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9799566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9809566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 981383922c3SLisandro Dalcin 982416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 984fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 985d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9860513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 987b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 988416022c9SBarry Smith for (i = 0; i < m; i++) { 9899371c9d4SSatish Balay y_l = m - i - 1.0; 9909371c9d4SSatish Balay y_r = y_l + 1.0; 991bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9929371c9d4SSatish Balay x_l = a->j[j]; 9939371c9d4SSatish Balay x_r = x_l + 1.0; 994fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9959566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 996cddf8d76SBarry Smith } 997cddf8d76SBarry Smith } 998b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 999cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10009371c9d4SSatish Balay y_l = m - i - 1.0; 10019371c9d4SSatish Balay y_r = y_l + 1.0; 1002bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10039371c9d4SSatish Balay x_l = a->j[j]; 10049371c9d4SSatish Balay x_r = x_l + 1.0; 1005fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 10069566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1007cddf8d76SBarry Smith } 1008cddf8d76SBarry Smith } 1009b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1010cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10119371c9d4SSatish Balay y_l = m - i - 1.0; 10129371c9d4SSatish Balay y_r = y_l + 1.0; 1013bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10149371c9d4SSatish Balay x_l = a->j[j]; 10159371c9d4SSatish Balay x_r = x_l + 1.0; 1016fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10179566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1018416022c9SBarry Smith } 1019416022c9SBarry Smith } 1020d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10210513a670SBarry Smith } else { 10220513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10230513a670SBarry Smith /* first determine max of all nonzero values */ 1024b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1025383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1026b0a32e0cSBarry Smith PetscDraw popup; 10270513a670SBarry Smith 10280513a670SBarry Smith for (i = 0; i < nz; i++) { 1029fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10300513a670SBarry Smith } 1031383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10329566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10339566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1034383922c3SLisandro Dalcin 1035d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10360513a670SBarry Smith for (i = 0; i < m; i++) { 1037383922c3SLisandro Dalcin y_l = m - i - 1.0; 1038383922c3SLisandro Dalcin y_r = y_l + 1.0; 1039bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1040383922c3SLisandro Dalcin x_l = a->j[j]; 1041383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1042fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10439566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10440513a670SBarry Smith count++; 10450513a670SBarry Smith } 10460513a670SBarry Smith } 1047d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10480513a670SBarry Smith } 10499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1051480ef9eaSBarry Smith } 1052cddf8d76SBarry Smith 10539804daf3SBarry Smith #include <petscdraw.h> 1054ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1055d71ae5a4SJacob Faibussowitsch { 1056b0a32e0cSBarry Smith PetscDraw draw; 105736db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1058ace3abfcSBarry Smith PetscBool isnull; 1059480ef9eaSBarry Smith 1060480ef9eaSBarry Smith PetscFunctionBegin; 10619566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10629566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10633ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1064480ef9eaSBarry Smith 10659371c9d4SSatish Balay xr = A->cmap->n; 10669371c9d4SSatish Balay yr = A->rmap->n; 10679371c9d4SSatish Balay h = yr / 10.0; 10689371c9d4SSatish Balay w = xr / 10.0; 10699371c9d4SSatish Balay xr += w; 10709371c9d4SSatish Balay yr += h; 10719371c9d4SSatish Balay xl = -w; 10729371c9d4SSatish Balay yl = -h; 10739566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10749566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10759566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10769566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10779566063dSJacob 
Faibussowitsch PetscCall(PetscDrawSave(draw)); 10783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1079416022c9SBarry Smith } 1080416022c9SBarry Smith 1081d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1082d71ae5a4SJacob Faibussowitsch { 1083ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1084416022c9SBarry Smith 10853a40ed3dSBarry Smith PetscFunctionBegin; 10869566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10889566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10891baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10901baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10911baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10929566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109417ab2063SBarry Smith } 109519bcc07fSBarry Smith 1096d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1097d71ae5a4SJacob Faibussowitsch { 1098416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1099580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1100bc43efbbSJunchao Zhang PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n; 110154f21887SBarry Smith MatScalar *aa = a->a, *ap; 11023447b6efSHong Zhang PetscReal ratio = 0.6; 110317ab2063SBarry Smith 11043a40ed3dSBarry Smith PetscFunctionBegin; 11053ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 11069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1107b215bc84SStefano Zampini if 
(A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1108b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11099566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1111b215bc84SStefano Zampini } 111217ab2063SBarry Smith 111343ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 111417ab2063SBarry Smith for (i = 1; i < m; i++) { 1115416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 111617ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111794a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111817ab2063SBarry Smith if (fshift) { 1119bfeeae90SHong Zhang ip = aj + ai[i]; 1120bfeeae90SHong Zhang ap = aa + ai[i]; 112117ab2063SBarry Smith N = ailen[i]; 11229566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 112348a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 112417ab2063SBarry Smith } 112517ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112617ab2063SBarry Smith } 112717ab2063SBarry Smith if (m) { 112817ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112917ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 113017ab2063SBarry Smith } 113117ab2063SBarry Smith /* reset ilen and imax for each row */ 11327b083b7cSBarry Smith a->nonzerorowcnt = 0; 1133396832f4SHong Zhang if (A->structure_only) { 11349566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11359566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1136396832f4SHong Zhang } else { /* !A->structure_only */ 113717ab2063SBarry Smith for (i = 0; i < m; i++) { 113817ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11397b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 114017ab2063SBarry Smith } 1141396832f4SHong Zhang } 
1142bfeeae90SHong Zhang a->nz = ai[m]; 1143aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 1144bc43efbbSJunchao Zhang PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly 1145bc43efbbSJunchao Zhang a->diagonaldense = PETSC_TRUE; 1146bc43efbbSJunchao Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1147bc43efbbSJunchao Zhang for (i = 0; i < n; i++) { 1148bc43efbbSJunchao Zhang if (a->diag[i] >= ai[i + 1]) { 1149bc43efbbSJunchao Zhang a->diagonaldense = PETSC_FALSE; 1150bc43efbbSJunchao Zhang break; 1151bc43efbbSJunchao Zhang } 1152bc43efbbSJunchao Zhang } 11539566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11549566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11559566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11562205254eSKarl Rupp 11578e58a170SBarry Smith A->info.mallocs += a->reallocs; 1158dd5f02e7SSatish Balay a->reallocs = 0; 11596712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 116036db0b34SBarry Smith a->rmax = rmax; 11614e220ebcSLois Curfman McInnes 116248a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11639566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 116517ab2063SBarry Smith } 116617ab2063SBarry Smith 1167ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1168d71ae5a4SJacob Faibussowitsch 
{ 116999cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 117099cafbc1SBarry Smith PetscInt i, nz = a->nz; 11712e5835c6SStefano Zampini MatScalar *aa; 117299cafbc1SBarry Smith 117399cafbc1SBarry Smith PetscFunctionBegin; 11749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117599cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 117999cafbc1SBarry Smith } 118099cafbc1SBarry Smith 1181ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1182d71ae5a4SJacob Faibussowitsch { 118399cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 118499cafbc1SBarry Smith PetscInt i, nz = a->nz; 11852e5835c6SStefano Zampini MatScalar *aa; 118699cafbc1SBarry Smith 118799cafbc1SBarry Smith PetscFunctionBegin; 11889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 118999cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119399cafbc1SBarry Smith } 119499cafbc1SBarry Smith 1195d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1196d71ae5a4SJacob Faibussowitsch { 1197fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1198fff043a9SJunchao Zhang MatScalar *aa; 11993a40ed3dSBarry Smith 12003a40ed3dSBarry Smith PetscFunctionBegin; 12019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 12029566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 12039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 12049566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 12053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120617ab2063SBarry Smith } 1207416022c9SBarry Smith 1208d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1209d71ae5a4SJacob Faibussowitsch { 1210416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1211d5d45c9bSBarry Smith 12123a40ed3dSBarry Smith PetscFunctionBegin; 1213b4e2f619SBarry Smith if (A->hash_active) { 1214e3c72094SPierre Jolivet A->ops[0] = a->cops; 1215b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 1216b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 1217b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 1218b4e2f619SBarry Smith } 1219b4e2f619SBarry Smith 12203ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 12219566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12229566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12239566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12289566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12299566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12309566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12319566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12329566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12339566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12349566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12359566063dSJacob Faibussowitsch 
PetscCall(PetscFree(A->data)); 1236901853e0SKris Buschelman 12376718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12386718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12396718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12406718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12416718818eSStefano Zampini due to different matrix sizes */ 12429566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12436718818eSStefano Zampini 12449566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12452e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12462e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12532e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12542e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12552e956fe4SStefano Zampini 
PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12562e956fe4SStefano Zampini #endif 12574222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12614222ddf1SHong Zhang #endif 1262d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1263d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1264d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1265d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1266d5e393b6SSuyash Tandon #endif 12673d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12693d0639e7SStefano Zampini #endif 12709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1271af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12729566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1273af8000cdSHong Zhang #endif 1274d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1276d24d4204SJose E. 
Roman #endif 127763c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 128063c07aadSStefano Zampini #endif 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12852e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12962e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12972e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12982e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12992e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 13002e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 13012e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 13022e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 13033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 130417ab2063SBarry Smith } 130517ab2063SBarry Smith 1306d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1307d71ae5a4SJacob Faibussowitsch { 1308416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13093a40ed3dSBarry Smith 13103a40ed3dSBarry Smith PetscFunctionBegin; 1311a65d3064SKris Buschelman switch (op) { 1312d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1313d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1314d71ae5a4SJacob Faibussowitsch break; 1315d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1316d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1317d71ae5a4SJacob Faibussowitsch break; 1318d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 
1319d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1320d71ae5a4SJacob Faibussowitsch break; 1321d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1322d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1323d71ae5a4SJacob Faibussowitsch break; 1324d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1325d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1326d71ae5a4SJacob Faibussowitsch break; 1327d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1328d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1329d71ae5a4SJacob Faibussowitsch break; 1330d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1331d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1332d71ae5a4SJacob Faibussowitsch break; 13333d472b54SHong Zhang case MAT_SPD: 1334b1646e73SJed Brown case MAT_SYMMETRIC: 1335b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1336b1646e73SJed Brown case MAT_HERMITIAN: 1337b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1338957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1339b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1340b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 13415021d80fSJed Brown break; 13428c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1343a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1344d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1345d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1346d71ae5a4SJacob Faibussowitsch break; 1347d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1348d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1349d71ae5a4SJacob Faibussowitsch break; 1350d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1351d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1352d71ae5a4SJacob Faibussowitsch break; 1353071fcb05SBarry Smith case MAT_SORTED_FULL: 1354071fcb05SBarry Smith if (flg) A->ops->setvalues = 
MatSetValues_SeqAIJ_SortedFull; 1355071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1356071fcb05SBarry Smith break; 1357d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1358d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1359d71ae5a4SJacob Faibussowitsch break; 1360d71ae5a4SJacob Faibussowitsch default: 1361d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1362a65d3064SKris Buschelman } 13633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 136417ab2063SBarry Smith } 136517ab2063SBarry Smith 1366ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1367d71ae5a4SJacob Faibussowitsch { 1368416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1369fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1370c898d852SStefano Zampini PetscScalar *x; 1371c898d852SStefano Zampini const PetscScalar *aa; 137217ab2063SBarry Smith 13733a40ed3dSBarry Smith PetscFunctionBegin; 13749566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 137508401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1377d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1378d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13799566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13802c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13819566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 138435e7444dSHong Zhang } 138535e7444dSHong Zhang 13869566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 138735e7444dSHong Zhang for (i = 0; i < n; i++) { 
1388fdc842d1SBarry Smith x[i] = 0.0; 138935e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 139035e7444dSHong Zhang if (aj[j] == i) { 139135e7444dSHong Zhang x[i] = aa[j]; 139217ab2063SBarry Smith break; 139317ab2063SBarry Smith } 139417ab2063SBarry Smith } 139517ab2063SBarry Smith } 13969566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 139917ab2063SBarry Smith } 140017ab2063SBarry Smith 1401c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1403d71ae5a4SJacob Faibussowitsch { 1404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 14055f22a7b3SSebastian Grimberg const MatScalar *aa; 1406d9ca1df4SBarry Smith PetscScalar *y; 1407d9ca1df4SBarry Smith const PetscScalar *x; 1408d0f46423SBarry Smith PetscInt m = A->rmap->n; 14095c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14105f22a7b3SSebastian Grimberg const MatScalar *v; 1411a77337e4SBarry Smith PetscScalar alpha; 1412d9ca1df4SBarry Smith PetscInt n, i, j; 1413d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14143447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1415ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14165c897100SBarry Smith #endif 141717ab2063SBarry Smith 14183a40ed3dSBarry Smith PetscFunctionBegin; 14199566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14209566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14219566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14235c897100SBarry Smith 14245c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1425fff043a9SJunchao Zhang 
fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14265c897100SBarry Smith #else 14273447b6efSHong Zhang if (usecprow) { 14283447b6efSHong Zhang m = cprow.nrows; 14293447b6efSHong Zhang ii = cprow.i; 14307b2bb3b9SHong Zhang ridx = cprow.rindex; 14313447b6efSHong Zhang } else { 14323447b6efSHong Zhang ii = a->i; 14333447b6efSHong Zhang } 143417ab2063SBarry Smith for (i = 0; i < m; i++) { 14353447b6efSHong Zhang idx = a->j + ii[i]; 1436fff043a9SJunchao Zhang v = aa + ii[i]; 14373447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14383447b6efSHong Zhang if (usecprow) { 14397b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14403447b6efSHong Zhang } else { 144117ab2063SBarry Smith alpha = x[i]; 14423447b6efSHong Zhang } 144304fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 144417ab2063SBarry Smith } 14455c897100SBarry Smith #endif 14469566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14479566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14489566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 145117ab2063SBarry Smith } 145217ab2063SBarry Smith 1453d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1454d71ae5a4SJacob Faibussowitsch { 14555c897100SBarry Smith PetscFunctionBegin; 14569566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14579566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14595c897100SBarry Smith } 14605c897100SBarry Smith 1461c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 146278b84d54SShri Abhyankar 1463d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 1464d71ae5a4SJacob Faibussowitsch { 1465416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ 
*)A->data; 1466d9fead3dSBarry Smith PetscScalar *y; 146754f21887SBarry Smith const PetscScalar *x; 14685914357eSBarry Smith const MatScalar *a_a; 1469003131ecSBarry Smith PetscInt m = A->rmap->n; 14705914357eSBarry Smith const PetscInt *ii, *ridx = NULL; 1471ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 147217ab2063SBarry Smith 1473b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 147497952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1475fee21e36SBarry Smith #endif 1476fee21e36SBarry Smith 14773a40ed3dSBarry Smith PetscFunctionBegin; 1478b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14799566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1481b215bc84SStefano Zampini } 14829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14839566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14849566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1485416022c9SBarry Smith ii = a->i; 14864eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14879566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 148897952fefSHong Zhang m = a->compressedrow.nrows; 148997952fefSHong Zhang ii = a->compressedrow.i; 149097952fefSHong Zhang ridx = a->compressedrow.rindex; 14915914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 14925914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 14935914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 14945914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 14955914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 14965914357eSBarry Smith PetscScalar sum = 0.0; 1497003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1498003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 149997952fefSHong Zhang y[*ridx++] = sum; 150097952fefSHong Zhang } 150197952fefSHong Zhang } else { /* do not use compressed row format */ 
1502b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15035914357eSBarry Smith fortranmultaij_(&m, x, ii, a->j, a_a, y); 1504b05257ddSBarry Smith #else 15055914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 15065914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 15075914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 15085914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 15095914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 15105914357eSBarry Smith PetscScalar sum = 0.0; 1511003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 151217ab2063SBarry Smith y[i] = sum; 151317ab2063SBarry Smith } 15148d195f9aSBarry Smith #endif 1515b05257ddSBarry Smith } 15169566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15179566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15189566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 152117ab2063SBarry Smith } 152217ab2063SBarry Smith 1523ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1524ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1525d71ae5a4SJacob Faibussowitsch { 1526b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1527b434eb95SMatthew G. Knepley PetscScalar *y; 1528b434eb95SMatthew G. Knepley const PetscScalar *x; 1529fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1530b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1531b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1532b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1533b434eb95SMatthew G. Knepley PetscScalar sum; 1534b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1535b434eb95SMatthew G. Knepley 1536b434eb95SMatthew G. 
Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1537b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1538b434eb95SMatthew G. Knepley #endif 1539b434eb95SMatthew G. Knepley 1540b434eb95SMatthew G. Knepley PetscFunctionBegin; 15419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15429566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15439566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1544b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1545b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1546b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1547b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1548b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1549b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1550b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1551fff043a9SJunchao Zhang aa = a_a + ii[i]; 1552b434eb95SMatthew G. Knepley sum = 0.0; 1553b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1554b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1555b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1556b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1557b434eb95SMatthew G. Knepley } 1558b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15593d3eaba7SBarry Smith ii = a->i; 1560b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1561b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1562b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1563fff043a9SJunchao Zhang aa = a_a + ii[i]; 1564b434eb95SMatthew G. Knepley sum = 0.0; 1565b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1566b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1567b434eb95SMatthew G. Knepley y[i] = sum; 1568b434eb95SMatthew G. Knepley } 1569b434eb95SMatthew G. 
Knepley } 15709566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15719566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15729566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1575b434eb95SMatthew G. Knepley } 1576b434eb95SMatthew G. Knepley 1577ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1578ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1579d71ae5a4SJacob Faibussowitsch { 1580b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1581b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1582b434eb95SMatthew G. Knepley const PetscScalar *x; 1583fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1584b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1585b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1586b434eb95SMatthew G. Knepley PetscScalar sum; 1587b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1588b434eb95SMatthew G. Knepley 1589b434eb95SMatthew G. Knepley PetscFunctionBegin; 15909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15919566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15929566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1593b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 159448a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1595b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1596b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1597b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1598b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1599b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1600b434eb95SMatthew G. 
Knepley aj = a->j + ii[i]; 1601fff043a9SJunchao Zhang aa = a_a + ii[i]; 1602b434eb95SMatthew G. Knepley sum = y[*ridx]; 1603b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1604b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1605b434eb95SMatthew G. Knepley } 1606b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16073d3eaba7SBarry Smith ii = a->i; 1608b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1609b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1610b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1611fff043a9SJunchao Zhang aa = a_a + ii[i]; 1612b434eb95SMatthew G. Knepley sum = y[i]; 1613b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1614b434eb95SMatthew G. Knepley z[i] = sum; 1615b434eb95SMatthew G. Knepley } 1616b434eb95SMatthew G. Knepley } 16179566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16189566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1622b434eb95SMatthew G. Knepley } 1623b434eb95SMatthew G. 
Knepley 1624c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1625d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1626d71ae5a4SJacob Faibussowitsch { 1627416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1628f15663dcSBarry Smith PetscScalar *y, *z; 1629f15663dcSBarry Smith const PetscScalar *x; 16305914357eSBarry Smith const MatScalar *a_a; 16315914357eSBarry Smith const PetscInt *ii, *ridx = NULL; 16325914357eSBarry Smith PetscInt m = A->rmap->n; 1633ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16349ea0dfa2SSatish Balay 16353a40ed3dSBarry Smith PetscFunctionBegin; 1636b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16379566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1639b215bc84SStefano Zampini } 16409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16419566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16429566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16434eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 164448a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 164597952fefSHong Zhang m = a->compressedrow.nrows; 164697952fefSHong Zhang ii = a->compressedrow.i; 164797952fefSHong Zhang ridx = a->compressedrow.rindex; 16485914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 16495914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 16505914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 16515914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 16525914357eSBarry Smith PetscScalar sum = y[*ridx]; 1653f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165497952fefSHong Zhang z[*ridx++] = sum; 165597952fefSHong Zhang } 165697952fefSHong Zhang } else { /* do not use compressed row format */ 16573d3eaba7SBarry Smith ii = a->i; 
1658f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16595914357eSBarry Smith fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z); 1660f15663dcSBarry Smith #else 16615914357eSBarry Smith PetscPragmaUseOMPKernels(parallel for) 16625914357eSBarry Smith for (PetscInt i = 0; i < m; i++) { 16635914357eSBarry Smith PetscInt n = ii[i + 1] - ii[i]; 16645914357eSBarry Smith const PetscInt *aj = a->j + ii[i]; 16655914357eSBarry Smith const PetscScalar *aa = a_a + ii[i]; 16665914357eSBarry Smith PetscScalar sum = y[i]; 1667f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 166817ab2063SBarry Smith z[i] = sum; 166917ab2063SBarry Smith } 167002ab625aSSatish Balay #endif 1671f15663dcSBarry Smith } 16729566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16739566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16749566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 167717ab2063SBarry Smith } 167817ab2063SBarry Smith 167917ab2063SBarry Smith /* 16800b4b7b1cSBarry Smith Adds diagonal pointers to sparse matrix nonzero structure. 
168117ab2063SBarry Smith */ 1682d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1683d71ae5a4SJacob Faibussowitsch { 1684416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1685d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1686c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 168717ab2063SBarry Smith 16883a40ed3dSBarry Smith PetscFunctionBegin; 168909f38230SBarry Smith if (!a->diag) { 16909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1691c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 169209f38230SBarry Smith } 1693d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1694c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1695c0c07093SJunchao Zhang if (alreadySet) { 1696c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1697c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1698c0c07093SJunchao Zhang } 1699c0c07093SJunchao Zhang 170009f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1701bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1702bfeeae90SHong Zhang if (a->j[j] == i) { 170309f38230SBarry Smith a->diag[i] = j; 170417ab2063SBarry Smith break; 170517ab2063SBarry Smith } 170617ab2063SBarry Smith } 170717ab2063SBarry Smith } 17083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 170917ab2063SBarry Smith } 171017ab2063SBarry Smith 1711ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1712d71ae5a4SJacob Faibussowitsch { 171361ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 171461ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 171561ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 171661ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 171761ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 171861ecd0c6SBarry Smith 171961ecd0c6SBarry 
/*
   MatShift_SeqAIJ - Adds v to the diagonal of A, inserting diagonal entries that are not yet stored.

   - If A is not preallocated or holds no nonzeros, one entry per row is preallocated and MatShift_Basic() does the work.
   - If no diagonal entry is missing (or a->diagonaldense is already set), MatShift_Basic() is called directly.
   - Otherwise the current i/j/a arrays are detached, imax is enlarged by one for every row that lacks a diagonal,
     the matrix is re-preallocated, the old entries plus v on the diagonal are re-inserted with ADD_VALUES, and the
     old arrays are released if the matrix owned them.

   a->diagonaldense is set to PETSC_TRUE on the non-early-return paths.

   NOTE(review): reads a->diag without marking it here; presumably the caller guarantees it is up to date
   (e.g. via MatMarkDiagonal_SeqAIJ()) -- confirm.
*/
static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v)
{
  Mat_SeqAIJ     *a    = (Mat_SeqAIJ *)A->data;
  const PetscInt *diag = (const PetscInt *)a->diag;
  const PetscInt *ii   = (const PetscInt *)a->i;
  PetscInt        i, *mdiag = NULL;
  PetscInt        cnt = 0; /* how many diagonals are missing */

  PetscFunctionBegin;
  if (!A->preallocated || !a->nz) {
    PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL));
    PetscCall(MatShift_Basic(A, v));
    PetscFunctionReturn(PETSC_SUCCESS);
  }

  if (a->diagonaldense) {
    cnt = 0;
  } else {
    /* mdiag[i] == 1 flags a row that needs a diagonal entry inserted; PetscCalloc1 leaves the rest at 0 */
    PetscCall(PetscCalloc1(A->rmap->n, &mdiag));
    for (i = 0; i < A->rmap->n; i++) {
      if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */
        cnt++;
        mdiag[i] = 1;
      }
    }
  }
  if (!cnt) {
    PetscCall(MatShift_Basic(A, v));
  } else {
    PetscScalar       *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */
    PetscInt          *oldj = a->j, *oldi = a->i;
    PetscBool          free_a = a->free_a, free_ij = a->free_ij; /* ownership flags captured before re-preallocation */
    const PetscScalar *Aa;

    PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host
    PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa));

    /* detach the old arrays from the matrix; they stay reachable only through olda/oldj/oldi */
    a->a = NULL;
    a->j = NULL;
    a->i = NULL;
    /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */
    for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i];
    PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax));

    /* copy old values into new matrix data structure */
    for (i = 0; i < A->rmap->n; i++) {
      /* a->imax[i] - mdiag[i] undoes the increment above, i.e. the row's previous imax is used as the entry count */
      PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES));
      if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES));
    }
    PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
    PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
    /* release the detached arrays only if the matrix owned them */
    if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda));
    if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj));
    if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi));
  }
  PetscCall(PetscFree(mdiag));
  a->diagonaldense = PETSC_TRUE;
  PetscFunctionReturn(PETSC_SUCCESS);
}
0, a->imax)); 175461ecd0c6SBarry Smith 175561ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 175661ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17579566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 175848a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1759447d62f5SStefano Zampini } 17609566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17619566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 17629f0612e4SBarry Smith if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda)); 17639f0612e4SBarry Smith if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj)); 17649f0612e4SBarry Smith if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi)); 176561ecd0c6SBarry Smith } 17669566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 176761ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 17683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 176961ecd0c6SBarry Smith } 177061ecd0c6SBarry Smith 1771be5855fcSBarry Smith /* 1772be5855fcSBarry Smith Checks for missing diagonals 1773be5855fcSBarry Smith */ 1774d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1775d71ae5a4SJacob Faibussowitsch { 1776be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17777734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1778be5855fcSBarry Smith 1779be5855fcSBarry Smith PetscFunctionBegin; 178009f38230SBarry Smith *missing = PETSC_FALSE; 17817734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 178209f38230SBarry Smith *missing = PETSC_TRUE; 178309f38230SBarry Smith if (d) *d = 0; 17849566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 178509f38230SBarry Smith } else { 178601445905SHong Zhang PetscInt n; 178701445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1788f1e2ffcdSBarry Smith diag = a->diag; 178901445905SHong Zhang for (i = 0; i < n; i++) { 17907734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 179109f38230SBarry Smith *missing = PETSC_TRUE; 179209f38230SBarry Smith if (d) *d = i; 17939566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1794358d2f5dSShri Abhyankar break; 179509f38230SBarry Smith } 1796be5855fcSBarry Smith } 1797be5855fcSBarry Smith } 17983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1799be5855fcSBarry Smith } 1800be5855fcSBarry Smith 18010da83c2eSBarry Smith #include <petscblaslapack.h> 18020da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18030da83c2eSBarry Smith 18040da83c2eSBarry Smith /* 18050da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18060da83c2eSBarry Smith */ 1807ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1808d71ae5a4SJacob Faibussowitsch { 18090da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18100da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18110da83c2eSBarry Smith const PetscReal shift = 0.0; 18120da83c2eSBarry Smith PetscInt ipvt[5]; 18134e208921SJed Brown PetscCount flops = 0; 18140da83c2eSBarry Smith PetscScalar work[25], *v_work; 18150da83c2eSBarry Smith 18160da83c2eSBarry Smith PetscFunctionBegin; 18170da83c2eSBarry Smith allowzeropivot = 
PetscNot(A->erroriffailure); 18180da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 181908401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1820ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18219566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 182248a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18230da83c2eSBarry Smith ncnt = 0; 18240da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18250da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18269566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18270da83c2eSBarry Smith switch (bsizes[i]) { 1828d71ae5a4SJacob Faibussowitsch case 1: 1829d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1830d71ae5a4SJacob Faibussowitsch break; 18310da83c2eSBarry Smith case 2: 18329566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18330da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18349566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18350da83c2eSBarry Smith break; 18360da83c2eSBarry Smith case 3: 18379566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18380da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18399566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18400da83c2eSBarry Smith break; 18410da83c2eSBarry Smith case 4: 18429566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18430da83c2eSBarry Smith if (zeropivotdetected) 
A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18449566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18450da83c2eSBarry Smith break; 18460da83c2eSBarry Smith case 5: 18479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18480da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18500da83c2eSBarry Smith break; 18510da83c2eSBarry Smith case 6: 18529566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18530da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18549566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18550da83c2eSBarry Smith break; 18560da83c2eSBarry Smith case 7: 18579566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18580da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18599566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18600da83c2eSBarry Smith break; 18610da83c2eSBarry Smith default: 18629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18630da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18649566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18650da83c2eSBarry Smith } 18660da83c2eSBarry Smith ncnt += bsizes[i]; 18670da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 1868baa50dc0SBrad Aagaard flops += 2 * PetscPowInt64(bsizes[i], 3) / 3; 18690da83c2eSBarry Smith } 18703ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 187148a46eb9SPierre 
Jolivet if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18729566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18740da83c2eSBarry Smith } 18750da83c2eSBarry Smith 1876422a814eSBarry Smith /* 1877422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1878422a814eSBarry Smith */ 1879ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1880d71ae5a4SJacob Faibussowitsch { 188171f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1882d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18832e5835c6SStefano Zampini const MatScalar *v; 188454f21887SBarry Smith PetscScalar *idiag, *mdiag; 188571f1c65dSBarry Smith 188671f1c65dSBarry Smith PetscFunctionBegin; 18873ba16761SJacob Faibussowitsch if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS); 18889566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 188971f1c65dSBarry Smith diag = a->diag; 18904dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18912e5835c6SStefano Zampini 189271f1c65dSBarry Smith mdiag = a->mdiag; 189371f1c65dSBarry Smith idiag = a->idiag; 18949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1895422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 189671f1c65dSBarry Smith for (i = 0; i < m; i++) { 189771f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1898899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1899899639b0SHong Zhang if (PetscRealPart(fshift)) { 19009566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 19017b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19027b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19037b6c816cSBarry Smith 
A->factorerror_zeropivot_row = i; 190498921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1905899639b0SHong Zhang } 190671f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 190771f1c65dSBarry Smith } 19089566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 190971f1c65dSBarry Smith } else { 191071f1c65dSBarry Smith for (i = 0; i < m; i++) { 191171f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 191271f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 191371f1c65dSBarry Smith } 19149566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 191571f1c65dSBarry Smith } 191671f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 19183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 191971f1c65dSBarry Smith } 192071f1c65dSBarry Smith 1921d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1922d71ae5a4SJacob Faibussowitsch { 1923416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1924e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19252e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 192654f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19273d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 192897f1f81fSBarry Smith const PetscInt *idx, *diag; 192917ab2063SBarry Smith 19303a40ed3dSBarry Smith PetscFunctionBegin; 1931b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19329566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 19333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1934b215bc84SStefano Zampini } 1935b965ef7fSBarry Smith its = its * lits; 193691723122SBarry Smith 193771f1c65dSBarry Smith if (fshift != a->fshift || omega != 
a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19389566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 193971f1c65dSBarry Smith a->fshift = fshift; 194071f1c65dSBarry Smith a->omega = omega; 1941ed480e8bSBarry Smith 194271f1c65dSBarry Smith diag = a->diag; 194371f1c65dSBarry Smith t = a->ssor_work; 1944ed480e8bSBarry Smith idiag = a->idiag; 194571f1c65dSBarry Smith mdiag = a->mdiag; 1946ed480e8bSBarry Smith 19479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19489566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19499566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1950ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 195117ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 195217ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1953ed480e8bSBarry Smith bs = b; 195417ab2063SBarry Smith for (i = 0; i < m; i++) { 195571f1c65dSBarry Smith d = fshift + mdiag[i]; 1956416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1957ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19582e5835c6SStefano Zampini v = aa + diag[i] + 1; 195917ab2063SBarry Smith sum = b[i] * d / omega; 1960003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 196117ab2063SBarry Smith x[i] = sum; 196217ab2063SBarry Smith } 19639566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19649566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19669566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 196817ab2063SBarry Smith } 1969c783ea89SBarry Smith 197008401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1971f7d195e4SLawrence 
Mitchell if (flag & SOR_EISENSTAT) { 19724c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1973887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 197417ab2063SBarry Smith 197517ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 197617ab2063SBarry Smith 1977887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 197817ab2063SBarry Smith */ 197917ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 198017ab2063SBarry Smith 198117ab2063SBarry Smith /* x = (E + U)^{-1} b */ 198217ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1983416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1984ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19852e5835c6SStefano Zampini v = aa + diag[i] + 1; 198617ab2063SBarry Smith sum = b[i]; 1987e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1988ed480e8bSBarry Smith x[i] = sum * idiag[i]; 198917ab2063SBarry Smith } 199017ab2063SBarry Smith 199117ab2063SBarry Smith /* t = b - (2*E - D)x */ 19922e5835c6SStefano Zampini v = aa; 19932205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 199417ab2063SBarry Smith 199517ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1996ed480e8bSBarry Smith ts = t; 1997416022c9SBarry Smith diag = a->diag; 199817ab2063SBarry Smith for (i = 0; i < m; i++) { 1999416022c9SBarry Smith n = diag[i] - a->i[i]; 2000ed480e8bSBarry Smith idx = a->j + a->i[i]; 20012e5835c6SStefano Zampini v = aa + a->i[i]; 200217ab2063SBarry Smith sum = t[i]; 2003003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 2004ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2005733d66baSBarry Smith /* x = x + t */ 2006733d66baSBarry Smith x[i] += t[i]; 200717ab2063SBarry Smith } 200817ab2063SBarry Smith 20099566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20109566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20119566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 
20123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 201317ab2063SBarry Smith } 201417ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 201517ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 201617ab2063SBarry Smith for (i = 0; i < m; i++) { 2017416022c9SBarry Smith n = diag[i] - a->i[i]; 2018ed480e8bSBarry Smith idx = a->j + a->i[i]; 20192e5835c6SStefano Zampini v = aa + a->i[i]; 202017ab2063SBarry Smith sum = b[i]; 2021e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20225c99c7daSBarry Smith t[i] = sum; 2023ed480e8bSBarry Smith x[i] = sum * idiag[i]; 202417ab2063SBarry Smith } 20255c99c7daSBarry Smith xb = t; 20269566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20273a40ed3dSBarry Smith } else xb = b; 202817ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 202917ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2030416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2031ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20322e5835c6SStefano Zampini v = aa + diag[i] + 1; 203317ab2063SBarry Smith sum = xb[i]; 2034e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20355c99c7daSBarry Smith if (xb == b) { 2036ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20375c99c7daSBarry Smith } else { 2038b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 203917ab2063SBarry Smith } 20405c99c7daSBarry Smith } 20419566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 204217ab2063SBarry Smith } 204317ab2063SBarry Smith its--; 204417ab2063SBarry Smith } 204517ab2063SBarry Smith while (its--) { 204617ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 204717ab2063SBarry Smith for (i = 0; i < m; i++) { 2048b19a5dc2SMark Adams /* lower */ 2049b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2050ed480e8bSBarry Smith idx = a->j + a->i[i]; 20512e5835c6SStefano 
Zampini v = aa + a->i[i]; 205217ab2063SBarry Smith sum = b[i]; 2053e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2054b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2055b19a5dc2SMark Adams /* upper */ 2056b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2057b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20582e5835c6SStefano Zampini v = aa + diag[i] + 1; 2059b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2060b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 206117ab2063SBarry Smith } 2062b19a5dc2SMark Adams xb = t; 20639566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2064b19a5dc2SMark Adams } else xb = b; 206517ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 206617ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2067b19a5dc2SMark Adams sum = xb[i]; 2068b19a5dc2SMark Adams if (xb == b) { 2069b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2070416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2071ed480e8bSBarry Smith idx = a->j + a->i[i]; 20722e5835c6SStefano Zampini v = aa + a->i[i]; 2073e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2074ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2075b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2076b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2077b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20782e5835c6SStefano Zampini v = aa + diag[i] + 1; 2079b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2080b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 208117ab2063SBarry Smith } 2082b19a5dc2SMark Adams } 2083b19a5dc2SMark Adams if (xb == b) { 20849566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2085b19a5dc2SMark Adams } else { 20869566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2087b19a5dc2SMark Adams } 208817ab2063SBarry Smith } 208917ab2063SBarry Smith } 20909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 20919566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 20929566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 209417ab2063SBarry Smith } 209517ab2063SBarry Smith 2096ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2097d71ae5a4SJacob Faibussowitsch { 2098416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 20994e220ebcSLois Curfman McInnes 21003a40ed3dSBarry Smith PetscFunctionBegin; 21014e220ebcSLois Curfman McInnes info->block_size = 1.0; 21023966268fSBarry Smith info->nz_allocated = a->maxnz; 21033966268fSBarry Smith info->nz_used = a->nz; 21043966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21053966268fSBarry Smith info->assemblies = A->num_ass; 21063966268fSBarry Smith info->mallocs = A->info.mallocs; 21074dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2108d5f3da31SBarry Smith if (A->factortype) { 21094e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21104e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21114e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21124e220ebcSLois Curfman McInnes } else { 21134e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21144e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21154e220ebcSLois Curfman McInnes info->factor_mallocs = 
0; 21164e220ebcSLois Curfman McInnes } 21173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 211817ab2063SBarry Smith } 211917ab2063SBarry Smith 2120ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2121d71ae5a4SJacob Faibussowitsch { 2122416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2123c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 212497b48c8fSBarry Smith const PetscScalar *xx; 21252e5835c6SStefano Zampini PetscScalar *bb, *aa; 2126c7da8527SEric Chamberland PetscInt d = 0; 212717ab2063SBarry Smith 21283a40ed3dSBarry Smith PetscFunctionBegin; 212997b48c8fSBarry Smith if (x && b) { 21309566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21319566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 213297b48c8fSBarry Smith for (i = 0; i < N; i++) { 2133aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2134447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 213597b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 213697b48c8fSBarry Smith } 21379566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21389566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 213997b48c8fSBarry Smith } 214097b48c8fSBarry Smith 21419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2142a9817697SBarry Smith if (a->keepnonzeropattern) { 2143f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2144aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21459566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2146f1e2ffcdSBarry Smith } 2147f4df32b1SMatthew Knepley if (diag != 0.0) { 2148c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2149c7da8527SEric 
Chamberland d = rows[i]; 2150447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 215108401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2152c7da8527SEric Chamberland } 2153f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2154447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21552e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2156f1e2ffcdSBarry Smith } 2157f1e2ffcdSBarry Smith } 2158f1e2ffcdSBarry Smith } else { 2159f4df32b1SMatthew Knepley if (diag != 0.0) { 216017ab2063SBarry Smith for (i = 0; i < N; i++) { 2161aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21627ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2163447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2164447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2165447d62f5SStefano Zampini } else { 2166416022c9SBarry Smith a->ilen[rows[i]] = 1; 21672e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2168bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2169447d62f5SStefano Zampini } 2170447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21719566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 217217ab2063SBarry Smith } 217317ab2063SBarry Smith } 21743a40ed3dSBarry Smith } else { 217517ab2063SBarry Smith for (i = 0; i < N; i++) { 2176aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2177416022c9SBarry Smith a->ilen[rows[i]] = 0; 217817ab2063SBarry Smith } 217917ab2063SBarry Smith } 2180e56f5c9eSBarry Smith A->nonzerostate++; 2181f1e2ffcdSBarry Smith } 21829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2183dbbe0bcdSBarry Smith 
PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 218517ab2063SBarry Smith } 218617ab2063SBarry Smith 2187ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2188d71ae5a4SJacob Faibussowitsch { 21896e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21906e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 21912b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 21926e169961SBarry Smith const PetscScalar *xx; 21932e5835c6SStefano Zampini PetscScalar *bb, *aa; 21946e169961SBarry Smith 21956e169961SBarry Smith PetscFunctionBegin; 21963ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 21979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 21986e169961SBarry Smith if (x && b) { 21999566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 22009566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 22012b40b63fSBarry Smith vecs = PETSC_TRUE; 22026e169961SBarry Smith } 22039566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 22046e169961SBarry Smith for (i = 0; i < N; i++) { 2205aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 22068e3a54c0SPierre Jolivet PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]])); 22072205254eSKarl Rupp 22086e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22096e169961SBarry Smith } 22106e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22116e169961SBarry Smith if (!zeroed[i]) { 22126e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22134cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22142e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22152e5835c6SStefano Zampini 
aa[j] = 0.0; 22166e169961SBarry Smith } 22176e169961SBarry Smith } 22184cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i]; 22196e169961SBarry Smith } 22206e169961SBarry Smith if (x && b) { 22219566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22229566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22236e169961SBarry Smith } 22249566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22256e169961SBarry Smith if (diag != 0.0) { 22269566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22271d5a398dSstefano_zampini if (missing) { 22281d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22294cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2230aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22319566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22321d5a398dSstefano_zampini } 22331d5a398dSstefano_zampini } else { 2234ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22356e169961SBarry Smith } 22361d5a398dSstefano_zampini } 22379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2238dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22406e169961SBarry Smith } 22416e169961SBarry Smith 2242d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2243d71ae5a4SJacob Faibussowitsch { 2244fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2245fff043a9SJunchao Zhang const PetscScalar *aa; 224617ab2063SBarry Smith 22473a40ed3dSBarry Smith PetscFunctionBegin; 22489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
2249416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 22508e3a54c0SPierre Jolivet if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]); 225117ab2063SBarry Smith if (idx) { 22525c0db29aSPierre Jolivet if (*nz && a->j) *idx = a->j + a->i[row]; 2253f4259b30SLisandro Dalcin else *idx = NULL; 225417ab2063SBarry Smith } 22559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225717ab2063SBarry Smith } 225817ab2063SBarry Smith 2259d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2260d71ae5a4SJacob Faibussowitsch { 22613a40ed3dSBarry Smith PetscFunctionBegin; 22623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 226317ab2063SBarry Smith } 226417ab2063SBarry Smith 2265ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2266d71ae5a4SJacob Faibussowitsch { 2267416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22682e5835c6SStefano Zampini const MatScalar *v; 226936db0b34SBarry Smith PetscReal sum = 0.0; 227097f1f81fSBarry Smith PetscInt i, j; 227117ab2063SBarry Smith 22723a40ed3dSBarry Smith PetscFunctionBegin; 22739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 227417ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2275570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2276570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2277792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2278570b7f6dSBarry Smith #else 2279416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22809371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22819371c9d4SSatish Balay v++; 228217ab2063SBarry Smith } 22838f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2284570b7f6dSBarry Smith #endif 22859566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22863a40ed3dSBarry Smith } else if (type == NORM_1) { 228736db0b34SBarry Smith PetscReal *tmp; 228897f1f81fSBarry Smith PetscInt *jj = a->j; 22899566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2290064f8208SBarry Smith *nrm = 0.0; 2291416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 22929371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 22939371c9d4SSatish Balay v++; 229417ab2063SBarry Smith } 2295d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2296064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 229717ab2063SBarry Smith } 22989566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 22999566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 23003a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2301064f8208SBarry Smith *nrm = 0.0; 2302d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 23038e3a54c0SPierre Jolivet const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]); 230417ab2063SBarry Smith sum = 0.0; 2305416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23069371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23079371c9d4SSatish Balay v2++; 230817ab2063SBarry Smith } 2309064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 231017ab2063SBarry Smith } 23119566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2312f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 231517ab2063SBarry Smith } 231617ab2063SBarry Smith 2317ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2318d71ae5a4SJacob Faibussowitsch { 23193d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 232054f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 
23212e5835c6SStefano Zampini const MatScalar *va, *vb; 232297f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2323cd0d46ebSvictorle 2324cd0d46ebSvictorle PetscFunctionBegin; 23259566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23269566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23275485867bSBarry Smith if (ma != nb || na != mb) { 23285485867bSBarry Smith *f = PETSC_FALSE; 23293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23305485867bSBarry Smith } 23319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23339371c9d4SSatish Balay aii = aij->i; 23349371c9d4SSatish Balay bii = bij->i; 23359371c9d4SSatish Balay adx = aij->j; 23369371c9d4SSatish Balay bdx = bij->j; 23379566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23389566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2339cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2340cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2341cd0d46ebSvictorle 2342cd0d46ebSvictorle *f = PETSC_TRUE; 2343cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2344cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 234597f1f81fSBarry Smith PetscInt idc, idr; 23465485867bSBarry Smith PetscScalar vc, vr; 2347cd0d46ebSvictorle /* column/row index/value */ 23485485867bSBarry Smith idc = adx[aptr[i]]; 23495485867bSBarry Smith idr = bdx[bptr[idc]]; 23505485867bSBarry Smith vc = va[aptr[i]]; 23515485867bSBarry Smith vr = vb[bptr[idc]]; 23525485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23535485867bSBarry Smith *f = PETSC_FALSE; 23545485867bSBarry Smith goto done; 2355cd0d46ebSvictorle } else { 23565485867bSBarry Smith aptr[i]++; 23575485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2358cd0d46ebSvictorle } 2359cd0d46ebSvictorle } 2360cd0d46ebSvictorle } 2361cd0d46ebSvictorle done: 23629566063dSJacob Faibussowitsch 
PetscCall(PetscFree(aptr)); 23639566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 23663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2367cd0d46ebSvictorle } 2368cd0d46ebSvictorle 2369ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2370d71ae5a4SJacob Faibussowitsch { 23713d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 237254f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 237354f21887SBarry Smith MatScalar *va, *vb; 23741cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23751cbb95d3SBarry Smith 23761cbb95d3SBarry Smith PetscFunctionBegin; 23779566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23789566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23791cbb95d3SBarry Smith if (ma != nb || na != mb) { 23801cbb95d3SBarry Smith *f = PETSC_FALSE; 23813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23821cbb95d3SBarry Smith } 23839371c9d4SSatish Balay aii = aij->i; 23849371c9d4SSatish Balay bii = bij->i; 23859371c9d4SSatish Balay adx = aij->j; 23869371c9d4SSatish Balay bdx = bij->j; 23879371c9d4SSatish Balay va = aij->a; 23889371c9d4SSatish Balay vb = bij->a; 23899566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 23911cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 23921cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 23931cbb95d3SBarry Smith 23941cbb95d3SBarry Smith *f = PETSC_TRUE; 23951cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 23961cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 23971cbb95d3SBarry Smith PetscInt idc, idr; 23981cbb95d3SBarry Smith PetscScalar vc, vr; 23991cbb95d3SBarry 
Smith /* column/row index/value */ 24001cbb95d3SBarry Smith idc = adx[aptr[i]]; 24011cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24021cbb95d3SBarry Smith vc = va[aptr[i]]; 24031cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24041cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24051cbb95d3SBarry Smith *f = PETSC_FALSE; 24061cbb95d3SBarry Smith goto done; 24071cbb95d3SBarry Smith } else { 24081cbb95d3SBarry Smith aptr[i]++; 24091cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24101cbb95d3SBarry Smith } 24111cbb95d3SBarry Smith } 24121cbb95d3SBarry Smith } 24131cbb95d3SBarry Smith done: 24149566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24159566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24171cbb95d3SBarry Smith } 24181cbb95d3SBarry Smith 2419d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2420d71ae5a4SJacob Faibussowitsch { 2421416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2422fff8e43fSBarry Smith const PetscScalar *l, *r; 2423fff8e43fSBarry Smith PetscScalar x; 242454f21887SBarry Smith MatScalar *v; 2425fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2426fff8e43fSBarry Smith const PetscInt *jj; 242717ab2063SBarry Smith 24283a40ed3dSBarry Smith PetscFunctionBegin; 242917ab2063SBarry Smith if (ll) { 24303ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24313ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24329566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 243308401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24349566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 243617ab2063SBarry Smith for (i = 0; i < m; i++) { 243717ab2063SBarry Smith x = 
l[i]; 2438416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24392205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 244017ab2063SBarry Smith } 24419566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24429566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 244417ab2063SBarry Smith } 244517ab2063SBarry Smith if (rr) { 24469566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 244708401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24489566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24502e5835c6SStefano Zampini jj = a->j; 24512205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24539566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24549566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 245517ab2063SBarry Smith } 24569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 24573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 245817ab2063SBarry Smith } 245917ab2063SBarry Smith 2460d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2461d71ae5a4SJacob Faibussowitsch { 2462db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2463d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 246497f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24655d0c19d7SBarry Smith const PetscInt *irow, *icol; 24662e5835c6SStefano Zampini const PetscScalar *aa; 24675d0c19d7SBarry Smith PetscInt nrows, ncols; 246897f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = 
a->ilen; 2469fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2470416022c9SBarry Smith Mat C; 2471cdc6f3adSToby Isaac PetscBool stride; 247217ab2063SBarry Smith 24733a40ed3dSBarry Smith PetscFunctionBegin; 24749566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24759566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24769566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 247717ab2063SBarry Smith 24789566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2479ff718158SBarry Smith if (stride) { 24809566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2481ff718158SBarry Smith } else { 2482ff718158SBarry Smith first = 0; 2483ff718158SBarry Smith step = 0; 2484ff718158SBarry Smith } 2485fee21e36SBarry Smith if (stride && step == 1) { 248602834360SBarry Smith /* special case of contiguous rows */ 24879566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 248802834360SBarry Smith /* loop over new rows determining lens and starting points */ 248902834360SBarry Smith for (i = 0; i < nrows; i++) { 2490bfeeae90SHong Zhang kstart = ai[irow[i]]; 2491a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2492a91a9bebSLisandro Dalcin starts[i] = kstart; 249302834360SBarry Smith for (k = kstart; k < kend; k++) { 2494bfeeae90SHong Zhang if (aj[k] >= first) { 249502834360SBarry Smith starts[i] = k; 249602834360SBarry Smith break; 249702834360SBarry Smith } 249802834360SBarry Smith } 2499a2744918SBarry Smith sum = 0; 250002834360SBarry Smith while (k < kend) { 2501bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2502a2744918SBarry Smith sum++; 250302834360SBarry Smith } 2504a2744918SBarry Smith lens[i] = sum; 250502834360SBarry Smith } 250602834360SBarry Smith /* create submatrix */ 2507cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 250897f1f81fSBarry Smith PetscInt n_cols, n_rows; 25099566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2510aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25119566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 251208480c60SBarry Smith C = *B; 25133a40ed3dSBarry Smith } else { 25143bef6203SJed Brown PetscInt rbs, cbs; 25159566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25169566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25179566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25189566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25199566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25209566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 252208480c60SBarry Smith } 2523db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2524db02288aSLois Curfman McInnes 252502834360SBarry Smith /* loop over rows inserting into submatrix */ 2526fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2527db02288aSLois Curfman McInnes j_new = c->j; 2528db02288aSLois Curfman McInnes i_new = c->i; 25299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 253002834360SBarry Smith for (i = 0; i < nrows; i++) { 2531a2744918SBarry Smith ii = starts[i]; 2532a2744918SBarry Smith lensi = lens[i]; 2533810441c8SPierre Jolivet if (lensi) { 2534ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25359566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2536a2744918SBarry Smith a_new += lensi; 2537810441c8SPierre Jolivet } 2538a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2539a2744918SBarry 
Smith c->ilen[i] = lensi; 254002834360SBarry Smith } 2541fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25439566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25443a40ed3dSBarry Smith } else { 25459566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25469566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25479566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25484dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25496bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25504dcab191SBarry Smith smap[icol[i]] = i + 1; 25514dcab191SBarry Smith } 25524dcab191SBarry Smith 255302834360SBarry Smith /* determine lens of each row */ 255402834360SBarry Smith for (i = 0; i < nrows; i++) { 2555bfeeae90SHong Zhang kstart = ai[irow[i]]; 255602834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 255702834360SBarry Smith lens[i] = 0; 255802834360SBarry Smith for (k = kstart; k < kend; k++) { 2559ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 256002834360SBarry Smith } 256102834360SBarry Smith } 256217ab2063SBarry Smith /* Create and fill new matrix */ 2563a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2564ace3abfcSBarry Smith PetscBool equal; 25650f5bd95cSBarry Smith 256699141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2567aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25689566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 2569fdfbdca6SPierre Jolivet PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. 
wrong number of nonzeros"); 25709566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 257108480c60SBarry Smith C = *B; 25723a40ed3dSBarry Smith } else { 25733bef6203SJed Brown PetscInt rbs, cbs; 25749566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25759566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25769566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25779566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 257837a5e0faSPierre Jolivet if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25799566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 258108480c60SBarry Smith } 25829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2583fb3c7e2dSJunchao Zhang 2584f4f49eeaSPierre Jolivet c = (Mat_SeqAIJ *)C->data; 2585fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 258617ab2063SBarry Smith for (i = 0; i < nrows; i++) { 258799141d43SSatish Balay row = irow[i]; 2588bfeeae90SHong Zhang kstart = ai[row]; 258999141d43SSatish Balay kend = kstart + a->ilen[row]; 2590bfeeae90SHong Zhang mat_i = c->i[i]; 25918e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 25928e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 259399141d43SSatish Balay mat_ilen = c->ilen + i; 259417ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2595bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2596ed480e8bSBarry Smith *mat_j++ = tcol - 1; 25972e5835c6SStefano Zampini *mat_a++ = aa[k]; 259899141d43SSatish Balay (*mat_ilen)++; 259917ab2063SBarry Smith } 260017ab2063SBarry Smith } 260117ab2063SBarry Smith } 26029566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 260302834360SBarry Smith /* Free work space */ 26049566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26059566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26069566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2607cdc6f3adSToby Isaac /* sort */ 2608cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2609cdc6f3adSToby Isaac PetscInt ilen; 2610cdc6f3adSToby Isaac 2611cdc6f3adSToby Isaac mat_i = c->i[i]; 26128e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 26138e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 2614cdc6f3adSToby Isaac ilen = c->ilen[i]; 26159566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2616cdc6f3adSToby Isaac } 2617fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 261802834360SBarry Smith } 26198c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26209566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2621305c6ccfSStefano Zampini #endif 26229566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26239566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 262417ab2063SBarry Smith 26259566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2626416022c9SBarry Smith *B = C; 26273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 262817ab2063SBarry Smith } 262917ab2063SBarry Smith 2630ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2631d71ae5a4SJacob Faibussowitsch { 263282d44351SHong Zhang Mat B; 263382d44351SHong Zhang 263482d44351SHong Zhang PetscFunctionBegin; 2635c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26369566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26379566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, 
mat->rmap->n, mat->cmap->n)); 26389566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26399566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26409566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 264182d44351SHong Zhang *subMat = B; 2642c2d650bdSHong Zhang } else { 26439566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2644c2d650bdSHong Zhang } 26453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 264682d44351SHong Zhang } 264782d44351SHong Zhang 2648ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2649d71ae5a4SJacob Faibussowitsch { 265063b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 265163b91edcSBarry Smith Mat outA; 2652ace3abfcSBarry Smith PetscBool row_identity, col_identity; 265363b91edcSBarry Smith 26543a40ed3dSBarry Smith PetscFunctionBegin; 265508401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26561df811f5SHong Zhang 26579566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 26589566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2659a871dcd8SBarry Smith 266063b91edcSBarry Smith outA = inA; 2661d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26629566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26639566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26642205254eSKarl Rupp 26659566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26669566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26672205254eSKarl Rupp 2668c3122656SLisandro Dalcin a->row = row; 26692205254eSKarl Rupp 26709566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26719566063dSJacob Faibussowitsch 
PetscCall(ISDestroy(&a->col)); 26722205254eSKarl Rupp 2673c3122656SLisandro Dalcin a->col = col; 267463b91edcSBarry Smith 267536db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26769566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 26779566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2678f0ec6fceSSatish Balay 267994a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 26809566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 268194a9d846SBarry Smith } 268263b91edcSBarry Smith 26839566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2684137fb511SHong Zhang if (row_identity && col_identity) { 26859566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2686137fb511SHong Zhang } else { 26879566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2688137fb511SHong Zhang } 26893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2690a871dcd8SBarry Smith } 2691a871dcd8SBarry Smith 2692d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2693d71ae5a4SJacob Faibussowitsch { 2694f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2695dfa0f9e5SStefano Zampini PetscScalar *v; 2696c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 26973a40ed3dSBarry Smith 26983a40ed3dSBarry Smith PetscFunctionBegin; 26999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27009566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2701792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27029566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 
27053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2706f0b747eeSBarry Smith } 2707f0b747eeSBarry Smith 2708d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2709d71ae5a4SJacob Faibussowitsch { 271016b64355SHong Zhang PetscInt i; 271116b64355SHong Zhang 271216b64355SHong Zhang PetscFunctionBegin; 271316b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27149566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 271516b64355SHong Zhang 271648a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27179566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 271816b64355SHong Zhang 271916b64355SHong Zhang if (submatj->rbuf1) { 27209566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27219566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 272216b64355SHong Zhang } 272316b64355SHong Zhang 272448a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27259566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27269566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 272716b64355SHong Zhang } 272816b64355SHong Zhang 272916b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2730eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27319566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27329566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 273316b64355SHong Zhang #else 27349566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 273516b64355SHong Zhang #endif 273616b64355SHong Zhang 273716b64355SHong Zhang if (!submatj->allcolumns) { 273816b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 
2739eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap)); 274016b64355SHong Zhang #else 27419566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 274216b64355SHong Zhang #endif 274316b64355SHong Zhang } 27449566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 274516b64355SHong Zhang 27469566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 27473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 274816b64355SHong Zhang } 274916b64355SHong Zhang 2750d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2751d71ae5a4SJacob Faibussowitsch { 275216b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27535c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 275416b64355SHong Zhang 275516b64355SHong Zhang PetscFunctionBegin; 27569566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27579566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 275916b64355SHong Zhang } 276016b64355SHong Zhang 276189a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 2762ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2763d71ae5a4SJacob Faibussowitsch { 27642d033e1fSHong Zhang PetscInt i; 27650fb991dcSHong Zhang Mat C; 27660fb991dcSHong Zhang Mat_SeqAIJ *c; 27670fb991dcSHong Zhang Mat_SubSppt *submatj; 27682d033e1fSHong Zhang 27692d033e1fSHong Zhang PetscFunctionBegin; 27702d033e1fSHong Zhang for (i = 0; i < n; i++) { 27710fb991dcSHong Zhang C = (*mat)[i]; 27720fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27730fb991dcSHong Zhang submatj = c->submatis1; 27742d033e1fSHong Zhang if (submatj) { 2775682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 277626cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 27779566063dSJacob Faibussowitsch 
PetscCall((*submatj->destroy)(C)); 27789566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27799566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 27803faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 27819566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 27829566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 27839566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2784682e4c99SStefano Zampini } 27852d033e1fSHong Zhang } else { 27869566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 27872d033e1fSHong Zhang } 27882d033e1fSHong Zhang } 278986e85357SHong Zhang 279063a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 27919566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 279263a75b2aSHong Zhang 27939566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 27943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 27952d033e1fSHong Zhang } 27962d033e1fSHong Zhang 2797ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2798d71ae5a4SJacob Faibussowitsch { 279997f1f81fSBarry Smith PetscInt i; 2800cddf8d76SBarry Smith 28013a40ed3dSBarry Smith PetscFunctionBegin; 280248a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2803cddf8d76SBarry Smith 280448a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2806cddf8d76SBarry Smith } 2807cddf8d76SBarry Smith 2808ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2809d71ae5a4SJacob Faibussowitsch { 2810e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28119a88ca10SBarry Smith PetscInt 
row, i, j, k, l, ll, m, n, *nidx, isz, val; 28125d0c19d7SBarry Smith const PetscInt *idx; 28139a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1; 2814f1af5d2fSBarry Smith PetscBT table; 2815bbd702dbSSatish Balay 28163a40ed3dSBarry Smith PetscFunctionBegin; 28179a88ca10SBarry Smith m = A->rmap->n / bs; 2818e4d965acSSatish Balay ai = a->i; 2819bfeeae90SHong Zhang aj = a->j; 28208a047759SSatish Balay 282108401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 282206763907SSatish Balay 28239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28249566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 282506763907SSatish Balay 2826e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2827b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2828e4d965acSSatish Balay isz = 0; 28299566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2830e4d965acSSatish Balay 2831e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28329566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28339566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2834e4d965acSSatish Balay 28359a88ca10SBarry Smith if (bs > 1) { 28369a88ca10SBarry Smith /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 28379a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28389a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28399a88ca10SBarry Smith } 28409a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28419a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28429a88ca10SBarry Smith 28439a88ca10SBarry Smith k = 0; 28449a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28459a88ca10SBarry Smith n = isz; 28469a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28479a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28489a88ca10SBarry Smith row = bs * nidx[k] + ll; 28499a88ca10SBarry Smith start = ai[row]; 28509a88ca10SBarry Smith end = ai[row + 1]; 28519a88ca10SBarry Smith for (l = start; l < end; l++) { 28529a88ca10SBarry Smith val = aj[l] / bs; 28539a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28549a88ca10SBarry Smith } 28559a88ca10SBarry Smith } 28569a88ca10SBarry Smith } 28579a88ca10SBarry Smith } 285857508eceSPierre Jolivet PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, is + i)); 28599a88ca10SBarry Smith } else { 2860dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2861e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28622205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28634dcbc457SBarry Smith } 28649566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28659566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2866e4d965acSSatish Balay 286704a348a9SBarry Smith k = 0; 286804a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 286904a348a9SBarry Smith n = isz; 287006763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2871e4d965acSSatish Balay row = nidx[k]; 2872e4d965acSSatish Balay start = ai[row]; 2873e4d965acSSatish Balay end = ai[row + 1]; 287404a348a9SBarry Smith for (l = start; l < end; l++) { 2875efb16452SHong Zhang val = aj[l]; 28762205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2877e4d965acSSatish Balay } 2878e4d965acSSatish Balay } 2879e4d965acSSatish Balay } 288057508eceSPierre Jolivet PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, is + i)); 2881e4d965acSSatish Balay } 28829a88ca10SBarry Smith } 28839566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 28849566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 28853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28864dcbc457SBarry Smith } 288717ab2063SBarry Smith 2888ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2889d71ae5a4SJacob Faibussowitsch { 28900513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28913b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 28925d0c19d7SBarry Smith const PetscInt *row, *col; 28935d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 289456cd22aeSBarry Smith IS icolp, irowp; 28950298fd71SBarry Smith PetscInt *cwork = NULL; 28960298fd71SBarry Smith PetscScalar *vwork = NULL; 28970513a670SBarry Smith 
28983a40ed3dSBarry Smith PetscFunctionBegin; 28999566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29009566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29019566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29029566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29030513a670SBarry Smith 29040513a670SBarry Smith /* determine lengths of permuted rows */ 29059566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29062205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29079566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29089566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29099566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29109566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29119566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29129566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29130513a670SBarry Smith 29149566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29150513a670SBarry Smith for (i = 0; i < m; i++) { 29169566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29172205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29189566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29199566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29200513a670SBarry Smith } 29219566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29222205254eSKarl Rupp 29233c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29242205254eSKarl Rupp 29258c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29269566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29279fe5e383SStefano Zampini #endif 
29289566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29299566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29309566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29319566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29329566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29339566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 293448a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29360513a670SBarry Smith } 29370513a670SBarry Smith 2938d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2939d71ae5a4SJacob Faibussowitsch { 2940cb5b572fSBarry Smith PetscFunctionBegin; 294133f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 294233f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2943be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2944be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29452e5835c6SStefano Zampini const PetscScalar *aa; 2946be6bf707SBarry Smith 29479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 294808401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29499566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29509566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29519566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2952cb5b572fSBarry Smith } else { 29539566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2954cb5b572fSBarry Smith } 29553ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 2956cb5b572fSBarry Smith } 2957cb5b572fSBarry Smith 2958d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2959d71ae5a4SJacob Faibussowitsch { 29606c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29616e111a19SKarl Rupp 29626c0721eeSBarry Smith PetscFunctionBegin; 29636c0721eeSBarry Smith *array = a->a; 29643ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29656c0721eeSBarry Smith } 29666c0721eeSBarry Smith 2967d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[]) 2968d71ae5a4SJacob Faibussowitsch { 29696c0721eeSBarry Smith PetscFunctionBegin; 2970f38c1e66SStefano Zampini *array = NULL; 29713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29726c0721eeSBarry Smith } 2973273d9f13SBarry Smith 29748229c054SShri Abhyankar /* 29758229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29768229c054SShri Abhyankar have different nonzero structure. 
29778229c054SShri Abhyankar */ 2978d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 2979d71ae5a4SJacob Faibussowitsch { 2980b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 2981ec7775f6SShri Abhyankar 2982ec7775f6SShri Abhyankar PetscFunctionBegin; 2983ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2984ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 29858e3a54c0SPierre Jolivet const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]); 2986b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 2987b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 29888af7cee1SJed Brown nnz[i] = 0; 29898af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 2990b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2991b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 29928af7cee1SJed Brown nnz[i]++; 29938af7cee1SJed Brown } 29948af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 2995ec7775f6SShri Abhyankar } 29963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2997ec7775f6SShri Abhyankar } 2998ec7775f6SShri Abhyankar 2999d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3000d71ae5a4SJacob Faibussowitsch { 3001b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3002b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3003b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data; 3004b264fe52SHong Zhang 3005b264fe52SHong Zhang PetscFunctionBegin; 3006b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30079566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 30083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3009b264fe52SHong Zhang } 
3010b264fe52SHong Zhang 3011d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3012d71ae5a4SJacob Faibussowitsch { 3013ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3014ac90fabeSBarry Smith 3015ac90fabeSBarry Smith PetscFunctionBegin; 3016134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3017134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3018134adf20SPierre Jolivet if (e) { 30199566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 302081fa06acSBarry Smith if (e) { 30219566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3022134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 302381fa06acSBarry Smith } 302481fa06acSBarry Smith } 302554c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 302681fa06acSBarry Smith } 3027ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30282e5835c6SStefano Zampini const PetscScalar *xa; 30292e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 303081fa06acSBarry Smith PetscBLASInt one = 1, bnz; 303181fa06acSBarry Smith 30329566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3035792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 30369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30389566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30409566063dSJacob 
Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3041ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30429566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3043ac90fabeSBarry Smith } else { 30448229c054SShri Abhyankar Mat B; 30458229c054SShri Abhyankar PetscInt *nnz; 30469566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30479566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30489566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30499566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30509566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30519566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30539566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30549566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30559bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30569566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3057ac90fabeSBarry Smith } 30583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3059ac90fabeSBarry Smith } 3060ac90fabeSBarry Smith 3061d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3062d71ae5a4SJacob Faibussowitsch { 3063354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3064354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3065354c94deSBarry Smith PetscInt i, nz; 3066354c94deSBarry Smith PetscScalar *a; 3067354c94deSBarry Smith 3068354c94deSBarry Smith PetscFunctionBegin; 3069354c94deSBarry Smith nz = aij->nz; 30709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30712205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 
30729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3073354c94deSBarry Smith #else 3074354c94deSBarry Smith PetscFunctionBegin; 3075354c94deSBarry Smith #endif 30763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3077354c94deSBarry Smith } 3078354c94deSBarry Smith 3079ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3080d71ae5a4SJacob Faibussowitsch { 3081e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3082d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3083e34fafa9SBarry Smith PetscReal atmp; 3084985db425SBarry Smith PetscScalar *x; 3085ce496241SStefano Zampini const MatScalar *aa, *av; 3086e34fafa9SBarry Smith 3087e34fafa9SBarry Smith PetscFunctionBegin; 308828b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 30899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3090ce496241SStefano Zampini aa = av; 3091e34fafa9SBarry Smith ai = a->i; 3092e34fafa9SBarry Smith aj = a->j; 3093e34fafa9SBarry Smith 30949566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 30959566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 309608401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3097e34fafa9SBarry Smith for (i = 0; i < m; i++) { 30989371c9d4SSatish Balay ncols = ai[1] - ai[0]; 30999371c9d4SSatish Balay ai++; 310062e5df07SMark Adams x[i] = 0; 3101e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3102985db425SBarry Smith atmp = PetscAbsScalar(*aa); 31039371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31049371c9d4SSatish Balay x[i] = atmp; 31059371c9d4SSatish Balay if (idx) idx[i] = *aj; 31069371c9d4SSatish Balay } 31079371c9d4SSatish Balay aa++; 31089371c9d4SSatish Balay aj++; 3109985db425SBarry Smith } 3110985db425SBarry Smith } 31119566063dSJacob 
Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3114985db425SBarry Smith } 3115985db425SBarry Smith 3116eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v) 3117eede4a3fSMark Adams { 3118eede4a3fSMark Adams Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3119eede4a3fSMark Adams PetscInt i, j, m = A->rmap->n, *ai, ncols, n; 3120eede4a3fSMark Adams PetscScalar *x; 3121eede4a3fSMark Adams const MatScalar *aa, *av; 3122eede4a3fSMark Adams 3123eede4a3fSMark Adams PetscFunctionBegin; 3124eede4a3fSMark Adams PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3125eede4a3fSMark Adams PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3126eede4a3fSMark Adams aa = av; 3127eede4a3fSMark Adams ai = a->i; 3128eede4a3fSMark Adams 3129eede4a3fSMark Adams PetscCall(VecGetArrayWrite(v, &x)); 3130eede4a3fSMark Adams PetscCall(VecGetLocalSize(v, &n)); 3131eede4a3fSMark Adams PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3132eede4a3fSMark Adams for (i = 0; i < m; i++) { 3133eede4a3fSMark Adams ncols = ai[1] - ai[0]; 3134eede4a3fSMark Adams ai++; 313562e5df07SMark Adams x[i] = 0; 3136eede4a3fSMark Adams for (j = 0; j < ncols; j++) { 3137eede4a3fSMark Adams x[i] += PetscAbsScalar(*aa); 3138eede4a3fSMark Adams aa++; 3139eede4a3fSMark Adams } 3140eede4a3fSMark Adams } 3141eede4a3fSMark Adams PetscCall(VecRestoreArrayWrite(v, &x)); 3142eede4a3fSMark Adams PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 3143eede4a3fSMark Adams PetscFunctionReturn(PETSC_SUCCESS); 3144eede4a3fSMark Adams } 3145eede4a3fSMark Adams 3146ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3147d71ae5a4SJacob Faibussowitsch { 3148985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3149d0f46423SBarry 
Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3150985db425SBarry Smith PetscScalar *x; 3151ce496241SStefano Zampini const MatScalar *aa, *av; 3152985db425SBarry Smith 3153985db425SBarry Smith PetscFunctionBegin; 315428b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3156ce496241SStefano Zampini aa = av; 3157985db425SBarry Smith ai = a->i; 3158985db425SBarry Smith aj = a->j; 3159985db425SBarry Smith 31609566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31619566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 316208401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3163985db425SBarry Smith for (i = 0; i < m; i++) { 31649371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31659371c9d4SSatish Balay ai++; 3166d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31679371c9d4SSatish Balay x[i] = *aa; 31689371c9d4SSatish Balay if (idx) idx[i] = 0; 3169985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3170985db425SBarry Smith x[i] = 0.0; 3171985db425SBarry Smith if (idx) { 3172985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3173985db425SBarry Smith if (aj[j] > j) { 3174985db425SBarry Smith idx[i] = j; 3175985db425SBarry Smith break; 3176985db425SBarry Smith } 3177985db425SBarry Smith } 31781a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31791a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3180985db425SBarry Smith } 3181985db425SBarry Smith } 3182985db425SBarry Smith for (j = 0; j < ncols; j++) { 31839371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31849371c9d4SSatish Balay x[i] = *aa; 31859371c9d4SSatish Balay if (idx) idx[i] = *aj; 
31869371c9d4SSatish Balay } 31879371c9d4SSatish Balay aa++; 31889371c9d4SSatish Balay aj++; 3189985db425SBarry Smith } 3190985db425SBarry Smith } 31919566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3194985db425SBarry Smith } 3195985db425SBarry Smith 3196ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3197d71ae5a4SJacob Faibussowitsch { 3198c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3199c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3200ce496241SStefano Zampini PetscScalar *x; 3201ce496241SStefano Zampini const MatScalar *aa, *av; 3202c87e5d42SMatthew Knepley 3203c87e5d42SMatthew Knepley PetscFunctionBegin; 32049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3205ce496241SStefano Zampini aa = av; 3206c87e5d42SMatthew Knepley ai = a->i; 3207c87e5d42SMatthew Knepley aj = a->j; 3208c87e5d42SMatthew Knepley 32099566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32109566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 321108401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. 
%" PetscInt_FMT " rows", m, n); 3212c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32139371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32149371c9d4SSatish Balay ai++; 3215f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32169371c9d4SSatish Balay x[i] = *aa; 32179371c9d4SSatish Balay if (idx) idx[i] = 0; 3218f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3219f07e67edSHong Zhang x[i] = 0.0; 3220f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3221289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3222f07e67edSHong Zhang if (aj[j] > j) { 3223f07e67edSHong Zhang idx[i] = j; 32242205254eSKarl Rupp break; 32252205254eSKarl Rupp } 3226289a08f5SMatthew Knepley } 3227f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3228f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3229f07e67edSHong Zhang } 3230289a08f5SMatthew Knepley } 3231c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32329371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32339371c9d4SSatish Balay x[i] = *aa; 32349371c9d4SSatish Balay if (idx) idx[i] = *aj; 32359371c9d4SSatish Balay } 32369371c9d4SSatish Balay aa++; 32379371c9d4SSatish Balay aj++; 3238c87e5d42SMatthew Knepley } 3239c87e5d42SMatthew Knepley } 32409566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3243c87e5d42SMatthew Knepley } 3244c87e5d42SMatthew Knepley 3245ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3246d71ae5a4SJacob Faibussowitsch { 3247985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3248d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3249d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3250985db425SBarry Smith PetscScalar *x; 
3251ce496241SStefano Zampini const MatScalar *aa, *av; 3252985db425SBarry Smith 3253985db425SBarry Smith PetscFunctionBegin; 325428b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3256ce496241SStefano Zampini aa = av; 3257985db425SBarry Smith ai = a->i; 3258985db425SBarry Smith aj = a->j; 3259985db425SBarry Smith 32609566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32619566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 326208401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3263985db425SBarry Smith for (i = 0; i < m; i++) { 32649371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32659371c9d4SSatish Balay ai++; 3266d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32679371c9d4SSatish Balay x[i] = *aa; 32689371c9d4SSatish Balay if (idx) idx[i] = 0; 3269985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3270985db425SBarry Smith x[i] = 0.0; 3271985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3272985db425SBarry Smith for (j = 0; j < ncols; j++) { 3273985db425SBarry Smith if (aj[j] > j) { 3274985db425SBarry Smith idx[i] = j; 3275985db425SBarry Smith break; 3276985db425SBarry Smith } 3277985db425SBarry Smith } 3278fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3279fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3280985db425SBarry Smith } 3281985db425SBarry Smith } 3282985db425SBarry Smith for (j = 0; j < ncols; j++) { 32839371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32849371c9d4SSatish Balay x[i] = *aa; 32859371c9d4SSatish Balay if (idx) idx[i] = *aj; 32869371c9d4SSatish Balay } 32879371c9d4SSatish Balay aa++; 32889371c9d4SSatish Balay aj++; 3289e34fafa9SBarry Smith } 
3290e34fafa9SBarry Smith } 32919566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3294e34fafa9SBarry Smith } 3295bbead8a2SBarry Smith 3296ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values) 3297d71ae5a4SJacob Faibussowitsch { 3298bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 329933d57670SJed Brown PetscInt i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j; 3300bbead8a2SBarry Smith MatScalar *diag, work[25], *v_work; 33010da83c2eSBarry Smith const PetscReal shift = 0.0; 33021a9391e3SHong Zhang PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 3303bbead8a2SBarry Smith 3304bbead8a2SBarry Smith PetscFunctionBegin; 3305a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33064a0d0026SBarry Smith if (a->ibdiagvalid) { 33074a0d0026SBarry Smith if (values) *values = a->ibdiag; 33083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 33094a0d0026SBarry Smith } 33109566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 33114dfa11a4SJacob Faibussowitsch if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); } 3312bbead8a2SBarry Smith diag = a->ibdiag; 3313bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3314bbead8a2SBarry Smith /* factor and invert each block */ 3315bbead8a2SBarry Smith switch (bs) { 3316bbead8a2SBarry Smith case 1: 3317bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33189566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i)); 3319ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3320ec1892c8SHong Zhang if (allowzeropivot) { 33217b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33227b6c816cSBarry Smith 
A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33237b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33249566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON)); 332598921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON); 3326ec1892c8SHong Zhang } 3327bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3328bbead8a2SBarry Smith } 3329bbead8a2SBarry Smith break; 3330bbead8a2SBarry Smith case 2: 3331bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33329371c9d4SSatish Balay ij[0] = 2 * i; 33339371c9d4SSatish Balay ij[1] = 2 * i + 1; 33349566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 2, ij, 2, ij, diag)); 33359566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 33367b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33379566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3338bbead8a2SBarry Smith diag += 4; 3339bbead8a2SBarry Smith } 3340bbead8a2SBarry Smith break; 3341bbead8a2SBarry Smith case 3: 3342bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33439371c9d4SSatish Balay ij[0] = 3 * i; 33449371c9d4SSatish Balay ij[1] = 3 * i + 1; 33459371c9d4SSatish Balay ij[2] = 3 * i + 2; 33469566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 3, ij, 3, ij, diag)); 33479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 33487b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3350bbead8a2SBarry Smith diag += 9; 
3351bbead8a2SBarry Smith } 3352bbead8a2SBarry Smith break; 3353bbead8a2SBarry Smith case 4: 3354bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33559371c9d4SSatish Balay ij[0] = 4 * i; 33569371c9d4SSatish Balay ij[1] = 4 * i + 1; 33579371c9d4SSatish Balay ij[2] = 4 * i + 2; 33589371c9d4SSatish Balay ij[3] = 4 * i + 3; 33599566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 4, ij, 4, ij, diag)); 33609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 33617b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3363bbead8a2SBarry Smith diag += 16; 3364bbead8a2SBarry Smith } 3365bbead8a2SBarry Smith break; 3366bbead8a2SBarry Smith case 5: 3367bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33689371c9d4SSatish Balay ij[0] = 5 * i; 33699371c9d4SSatish Balay ij[1] = 5 * i + 1; 33709371c9d4SSatish Balay ij[2] = 5 * i + 2; 33719371c9d4SSatish Balay ij[3] = 5 * i + 3; 33729371c9d4SSatish Balay ij[4] = 5 * i + 4; 33739566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 5, ij, 5, ij, diag)); 33749566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 33757b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33769566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3377bbead8a2SBarry Smith diag += 25; 3378bbead8a2SBarry Smith } 3379bbead8a2SBarry Smith break; 3380bbead8a2SBarry Smith case 6: 3381bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33829371c9d4SSatish Balay ij[0] = 6 * i; 33839371c9d4SSatish Balay ij[1] = 6 * i + 1; 33849371c9d4SSatish Balay ij[2] = 6 * i + 2; 33859371c9d4SSatish Balay ij[3] = 6 * i + 3; 33869371c9d4SSatish Balay ij[4] = 6 * i + 4; 33879371c9d4SSatish Balay ij[5] = 6 * i + 5; 33889566063dSJacob 
Faibussowitsch PetscCall(MatGetValues(A, 6, ij, 6, ij, diag)); 33899566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 33907b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33919566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3392bbead8a2SBarry Smith diag += 36; 3393bbead8a2SBarry Smith } 3394bbead8a2SBarry Smith break; 3395bbead8a2SBarry Smith case 7: 3396bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 33979371c9d4SSatish Balay ij[0] = 7 * i; 33989371c9d4SSatish Balay ij[1] = 7 * i + 1; 33999371c9d4SSatish Balay ij[2] = 7 * i + 2; 34009371c9d4SSatish Balay ij[3] = 7 * i + 3; 34019371c9d4SSatish Balay ij[4] = 7 * i + 4; 34029371c9d4SSatish Balay ij[5] = 7 * i + 5; 3403cdd8bf47SJunchao Zhang ij[6] = 7 * i + 6; 34049566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, 7, ij, 7, ij, diag)); 34059566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 34067b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34079566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3408bbead8a2SBarry Smith diag += 49; 3409bbead8a2SBarry Smith } 3410bbead8a2SBarry Smith break; 3411bbead8a2SBarry Smith default: 34129566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ)); 3413bbead8a2SBarry Smith for (i = 0; i < mbs; i++) { 3414ad540459SPierre Jolivet for (j = 0; j < bs; j++) IJ[j] = bs * i + j; 34159566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag)); 34169566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 34177b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34189566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs)); 3419bbead8a2SBarry Smith diag += bs2; 3420bbead8a2SBarry Smith } 34219566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work, v_pivots, IJ)); 3422bbead8a2SBarry Smith } 3423bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 34243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3425bbead8a2SBarry Smith } 3426bbead8a2SBarry Smith 3427d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx) 3428d71ae5a4SJacob Faibussowitsch { 342973a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3430fff043a9SJunchao Zhang PetscScalar a, *aa; 343173a71a0fSBarry Smith PetscInt m, n, i, j, col; 343273a71a0fSBarry Smith 343373a71a0fSBarry Smith PetscFunctionBegin; 343473a71a0fSBarry Smith if (!x->assembled) { 34359566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 343673a71a0fSBarry Smith for (i = 0; i < m; i++) { 343773a71a0fSBarry Smith for (j = 0; j < aij->imax[i]; j++) { 34389566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 343973a71a0fSBarry Smith col = (PetscInt)(n * PetscRealPart(a)); 34409566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 344173a71a0fSBarry Smith } 344273a71a0fSBarry Smith } 3443e2ce353bSJunchao Zhang } else { 34449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x, &aa)); 34459566063dSJacob Faibussowitsch for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i)); 34469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa)); 3447e2ce353bSJunchao Zhang } 34489566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34499566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 345173a71a0fSBarry Smith } 345273a71a0fSBarry Smith 3453679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on 
columns in range of [low, high) */ 3454d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3455d71ae5a4SJacob Faibussowitsch { 3456679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3457679944adSJunchao Zhang PetscScalar a; 3458679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3459679944adSJunchao Zhang 3460679944adSJunchao Zhang PetscFunctionBegin; 3461679944adSJunchao Zhang nskip = high - low; 34629566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3463679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3464679944adSJunchao Zhang for (i = 0; i < m; i++) { 3465679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34669566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3467679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3468679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34699566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3470679944adSJunchao Zhang } 3471e2ce353bSJunchao Zhang } 34729566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34739566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3475679944adSJunchao Zhang } 3476679944adSJunchao Zhang 34770a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3478cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3479cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3480cb5b572fSBarry Smith MatMult_SeqAIJ, 348197304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34827c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34837c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3484f4259b30SLisandro Dalcin NULL, 3485f4259b30SLisandro Dalcin NULL, 3486f4259b30SLisandro Dalcin NULL, 3487f4259b30SLisandro Dalcin /* 10*/ 
NULL, 3488cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3489f4259b30SLisandro Dalcin NULL, 349041f059aeSBarry Smith MatSOR_SeqAIJ, 349191e9d3e2SHong Zhang MatTranspose_SeqAIJ, 349297304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3493cb5b572fSBarry Smith MatEqual_SeqAIJ, 3494cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3495cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3496cb5b572fSBarry Smith MatNorm_SeqAIJ, 3497f4259b30SLisandro Dalcin /* 20*/ NULL, 3498cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3499cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3500cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3501d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3502f4259b30SLisandro Dalcin NULL, 3503f4259b30SLisandro Dalcin NULL, 3504f4259b30SLisandro Dalcin NULL, 3505f4259b30SLisandro Dalcin NULL, 350626cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 3507f4259b30SLisandro Dalcin NULL, 3508f4259b30SLisandro Dalcin NULL, 3509f4259b30SLisandro Dalcin NULL, 3510f4259b30SLisandro Dalcin NULL, 3511d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3512f4259b30SLisandro Dalcin NULL, 3513f4259b30SLisandro Dalcin NULL, 3514cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3515f4259b30SLisandro Dalcin NULL, 3516d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35177dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3518cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3519cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3520cb5b572fSBarry Smith MatCopy_SeqAIJ, 3521d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3522cb5b572fSBarry Smith MatScale_SeqAIJ, 35237d68702bSBarry Smith MatShift_SeqAIJ, 352479299369SBarry Smith MatDiagonalSet_SeqAIJ, 35256e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 352673a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35273b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35283b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35293b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3530a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 353193dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 
3532f4259b30SLisandro Dalcin NULL, 3533f4259b30SLisandro Dalcin NULL, 3534cda55fadSBarry Smith MatPermute_SeqAIJ, 3535f4259b30SLisandro Dalcin NULL, 3536f4259b30SLisandro Dalcin /* 59*/ NULL, 3537b9b97703SBarry Smith MatDestroy_SeqAIJ, 3538b9b97703SBarry Smith MatView_SeqAIJ, 3539f4259b30SLisandro Dalcin NULL, 3540f4259b30SLisandro Dalcin NULL, 3541f4259b30SLisandro Dalcin /* 64*/ NULL, 3542321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3543f4259b30SLisandro Dalcin NULL, 3544f4259b30SLisandro Dalcin NULL, 3545f4259b30SLisandro Dalcin NULL, 3546d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3547c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin NULL, 3550f4259b30SLisandro Dalcin NULL, 3551f4259b30SLisandro Dalcin /* 74*/ NULL, 35523acb8795SBarry Smith MatFDColoringApply_AIJ, 3553f4259b30SLisandro Dalcin NULL, 3554f4259b30SLisandro Dalcin NULL, 3555f4259b30SLisandro Dalcin NULL, 35566ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3557f4259b30SLisandro Dalcin NULL, 3558f4259b30SLisandro Dalcin NULL, 3559f4259b30SLisandro Dalcin NULL, 3560bc011b1eSHong Zhang MatLoad_SeqAIJ, 35616cff0a6bSPierre Jolivet /* 84*/ NULL, 35626cff0a6bSPierre Jolivet NULL, 3563f4259b30SLisandro Dalcin NULL, 3564f4259b30SLisandro Dalcin NULL, 3565f4259b30SLisandro Dalcin NULL, 3566f4259b30SLisandro Dalcin /* 89*/ NULL, 3567f4259b30SLisandro Dalcin NULL, 356826be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3569f4259b30SLisandro Dalcin NULL, 3570f4259b30SLisandro Dalcin NULL, 35718fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3572f4259b30SLisandro Dalcin NULL, 3573f4259b30SLisandro Dalcin NULL, 35746fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3575f4259b30SLisandro Dalcin NULL, 35764222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3577f4259b30SLisandro Dalcin NULL, 3578f4259b30SLisandro Dalcin NULL, 357987d4246cSBarry Smith MatConjugate_SeqAIJ, 
3580f4259b30SLisandro Dalcin NULL, 3581d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 358299cafbc1SBarry Smith MatRealPart_SeqAIJ, 3583f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3584f4259b30SLisandro Dalcin NULL, 3585f4259b30SLisandro Dalcin NULL, 3586cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3587f4259b30SLisandro Dalcin NULL, 35882af78befSBarry Smith MatGetRowMin_SeqAIJ, 3589f4259b30SLisandro Dalcin NULL, 3590599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3591f4259b30SLisandro Dalcin /*114*/ NULL, 3592f4259b30SLisandro Dalcin NULL, 3593f4259b30SLisandro Dalcin NULL, 3594f4259b30SLisandro Dalcin NULL, 3595f4259b30SLisandro Dalcin NULL, 3596f4259b30SLisandro Dalcin /*119*/ NULL, 3597f4259b30SLisandro Dalcin NULL, 3598f4259b30SLisandro Dalcin NULL, 3599f4259b30SLisandro Dalcin NULL, 3600b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 36010716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3602a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 360337868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 36040da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3605f4259b30SLisandro Dalcin NULL, 3606f4259b30SLisandro Dalcin /*129*/ NULL, 3607f4259b30SLisandro Dalcin NULL, 3608f4259b30SLisandro Dalcin NULL, 360975648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3610b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3611b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36122b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3613f4259b30SLisandro Dalcin NULL, 3614f4259b30SLisandro Dalcin NULL, 36153964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3616f4259b30SLisandro Dalcin /*139*/ NULL, 3617f4259b30SLisandro Dalcin NULL, 3618f4259b30SLisandro Dalcin NULL, 36193a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36209c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36214222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36224222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 
3623f4259b30SLisandro Dalcin NULL, 362472833a62Smarkadams4 NULL, 362572833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36262d776b49SBarry Smith NULL, 3627dec0b466SHong Zhang /*150*/ MatTransposeSymbolic_SeqAIJ, 3628eede4a3fSMark Adams MatEliminateZeros_SeqAIJ, 36294cc2b5b5SPierre Jolivet MatGetRowSumAbs_SeqAIJ, 363042ce410bSJunchao Zhang NULL, 363142ce410bSJunchao Zhang NULL, 36324cc2b5b5SPierre Jolivet NULL}; 363317ab2063SBarry Smith 3634ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3635d71ae5a4SJacob Faibussowitsch { 3636bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 363797f1f81fSBarry Smith PetscInt i, nz, n; 3638bef8e0ddSBarry Smith 3639bef8e0ddSBarry Smith PetscFunctionBegin; 3640bef8e0ddSBarry Smith nz = aij->maxnz; 3641d0f46423SBarry Smith n = mat->rmap->n; 3642ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3643bef8e0ddSBarry Smith aij->nz = nz; 3644ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 36453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3646bef8e0ddSBarry Smith } 3647bef8e0ddSBarry Smith 3648a3bb6f32SFande Kong /* 3649ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3650ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3651ddea5d60SJunchao Zhang */ 3652d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3653d71ae5a4SJacob Faibussowitsch { 3654a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3655eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3656eec179cfSJacob Faibussowitsch PetscHashIter tpos; 365725b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 365825b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3659a3bb6f32SFande Kong 3660a3bb6f32SFande Kong PetscFunctionBegin; 3661a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 36624f572ea9SToby Isaac PetscAssertPointer(mapping, 2); 3663a3bb6f32SFande Kong /* use a table */ 3664eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3665a3bb6f32SFande Kong ec = 0; 366625b670f0SStefano Zampini for (i = 0; i < nz; i++) { 366725b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3668eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3669a3bb6f32SFande Kong if (!data) { 3670a3bb6f32SFande Kong /* one based table */ 3671c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3672a3bb6f32SFande Kong } 3673a3bb6f32SFande Kong } 3674a3bb6f32SFande Kong /* form array of columns we need */ 36759566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3676eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3677eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3678eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3679eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3680eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3681a3bb6f32SFande Kong gid--; 3682a3bb6f32SFande 
Kong lid--; 3683a3bb6f32SFande Kong garray[lid] = gid; 3684a3bb6f32SFande Kong } 36859566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3686eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3687c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3688a3bb6f32SFande Kong /* compact out the extra columns in B */ 368925b670f0SStefano Zampini for (i = 0; i < nz; i++) { 369025b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3691eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3692a3bb6f32SFande Kong lid--; 369325b670f0SStefano Zampini jj[i] = lid; 3694a3bb6f32SFande Kong } 36959566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3696eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 36979566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36989566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36999566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 37003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3701a3bb6f32SFande Kong } 3702a3bb6f32SFande Kong 3703bef8e0ddSBarry Smith /*@ 3704bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3705bef8e0ddSBarry Smith in the matrix. 
3706bef8e0ddSBarry Smith 3707bef8e0ddSBarry Smith Input Parameters: 370811a5261eSBarry Smith + mat - the `MATSEQAIJ` matrix 3709bef8e0ddSBarry Smith - indices - the column indices 3710bef8e0ddSBarry Smith 371115091d37SBarry Smith Level: advanced 371215091d37SBarry Smith 3713bef8e0ddSBarry Smith Notes: 3714bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3715bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 371611a5261eSBarry Smith of the `MatSetValues()` operation. 3717bef8e0ddSBarry Smith 3718bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 371911a5261eSBarry Smith `MatCreateSeqAIJ()`, and the columns indices MUST be sorted. 3720bef8e0ddSBarry Smith 372111a5261eSBarry Smith MUST be called before any calls to `MatSetValues()` 3722bef8e0ddSBarry Smith 3723b9617806SBarry Smith The indices should start with zero, not one. 3724b9617806SBarry Smith 37251cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ` 3726bef8e0ddSBarry Smith @*/ 3727d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices) 3728d71ae5a4SJacob Faibussowitsch { 3729bef8e0ddSBarry Smith PetscFunctionBegin; 37300700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 37314f572ea9SToby Isaac PetscAssertPointer(indices, 2); 3732cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 37333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3734bef8e0ddSBarry Smith } 3735bef8e0ddSBarry Smith 3736ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3737d71ae5a4SJacob Faibussowitsch { 3738be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3739d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3740be6bf707SBarry Smith 3741be6bf707SBarry Smith PetscFunctionBegin; 374228b400f6SJacob Faibussowitsch 
PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3743be6bf707SBarry Smith 3744be6bf707SBarry Smith /* allocate space for values if not already there */ 37454dfa11a4SJacob Faibussowitsch if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); } 3746be6bf707SBarry Smith 3747be6bf707SBarry Smith /* copy values over */ 37489566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 37493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3750be6bf707SBarry Smith } 3751be6bf707SBarry Smith 3752be6bf707SBarry Smith /*@ 375320f4b53cSBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the 3754be6bf707SBarry Smith nonlinear portion. 3755be6bf707SBarry Smith 3756c3339decSBarry Smith Logically Collect 3757be6bf707SBarry Smith 375827430b45SBarry Smith Input Parameter: 375911a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3760be6bf707SBarry Smith 376115091d37SBarry Smith Level: advanced 376215091d37SBarry Smith 37632920cce0SJacob Faibussowitsch Example Usage: 376427430b45SBarry Smith .vb 37652ef1f0ffSBarry Smith Using SNES 376627430b45SBarry Smith Create Jacobian matrix 376727430b45SBarry Smith Set linear terms into matrix 376827430b45SBarry Smith Apply boundary conditions to matrix, at this time matrix must have 376927430b45SBarry Smith final nonzero structure (i.e. 
setting the nonlinear terms and applying 377027430b45SBarry Smith boundary conditions again will not change the nonzero structure 377127430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 377227430b45SBarry Smith MatStoreValues(mat); 377327430b45SBarry Smith Call SNESSetJacobian() with matrix 377427430b45SBarry Smith In your Jacobian routine 377527430b45SBarry Smith MatRetrieveValues(mat); 377627430b45SBarry Smith Set nonlinear terms in matrix 3777be6bf707SBarry Smith 377827430b45SBarry Smith Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself: 377927430b45SBarry Smith // build linear portion of Jacobian 378027430b45SBarry Smith MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE); 378127430b45SBarry Smith MatStoreValues(mat); 378227430b45SBarry Smith loop over nonlinear iterations 378327430b45SBarry Smith MatRetrieveValues(mat); 378427430b45SBarry Smith // call MatSetValues(mat,...) to set nonliner portion of Jacobian 378527430b45SBarry Smith // call MatAssemblyBegin/End() on matrix 378627430b45SBarry Smith Solve linear system with Jacobian 378727430b45SBarry Smith endloop 378827430b45SBarry Smith .ve 3789be6bf707SBarry Smith 3790be6bf707SBarry Smith Notes: 3791da81f932SPierre Jolivet Matrix must already be assembled before calling this routine 379211a5261eSBarry Smith Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before 3793be6bf707SBarry Smith calling this routine. 3794be6bf707SBarry Smith 37950c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37960c468ba9SBarry Smith and does not allocated additional space. 
37970c468ba9SBarry Smith 3798fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()` 3799be6bf707SBarry Smith @*/ 3800d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat) 3801d71ae5a4SJacob Faibussowitsch { 3802be6bf707SBarry Smith PetscFunctionBegin; 38030700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 380428b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 380528b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3806cac4c232SBarry Smith PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat)); 38073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3808be6bf707SBarry Smith } 3809be6bf707SBarry Smith 3810ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3811d71ae5a4SJacob Faibussowitsch { 3812be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3813d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3814be6bf707SBarry Smith 3815be6bf707SBarry Smith PetscFunctionBegin; 381628b400f6SJacob Faibussowitsch PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 381728b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 3818be6bf707SBarry Smith /* copy values over */ 38199566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 38203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3821be6bf707SBarry Smith } 3822be6bf707SBarry Smith 3823be6bf707SBarry Smith /*@ 382420f4b53cSBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()` 3825be6bf707SBarry Smith 3826c3339decSBarry Smith Logically Collect 3827be6bf707SBarry Smith 38282fe279fdSBarry Smith 
Input Parameter: 382911a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option) 3830be6bf707SBarry Smith 383115091d37SBarry Smith Level: advanced 383215091d37SBarry Smith 38331cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()` 3834be6bf707SBarry Smith @*/ 3835d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat) 3836d71ae5a4SJacob Faibussowitsch { 3837be6bf707SBarry Smith PetscFunctionBegin; 38380700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 383928b400f6SJacob Faibussowitsch PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 384028b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 3841cac4c232SBarry Smith PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat)); 38423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3843be6bf707SBarry Smith } 3844be6bf707SBarry Smith 38455d83a8b1SBarry Smith /*@ 384611a5261eSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format 38470d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 384820f4b53cSBarry Smith the user should preallocate the matrix storage by setting the parameter `nz` 384920f4b53cSBarry Smith (or the array `nnz`). 385017ab2063SBarry Smith 3851d083f849SBarry Smith Collective 3852db81eaa0SLois Curfman McInnes 385317ab2063SBarry Smith Input Parameters: 385411a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 385517ab2063SBarry Smith . m - number of rows 385617ab2063SBarry Smith . n - number of columns 385717ab2063SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 385851c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38590298fd71SBarry Smith (possibly different for each row) or NULL 386017ab2063SBarry Smith 386117ab2063SBarry Smith Output Parameter: 3862416022c9SBarry Smith . A - the matrix 386317ab2063SBarry Smith 38642ef1f0ffSBarry Smith Options Database Keys: 38652ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 38662ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 38672ef1f0ffSBarry Smith 38682ef1f0ffSBarry Smith Level: intermediate 3869175b88e8SBarry Smith 3870b259b22eSLois Curfman McInnes Notes: 387177433607SBarry Smith It is recommend to use `MatCreateFromOptions()` instead of this routine 387277433607SBarry Smith 38732ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 387449a6f317SBarry Smith 38752ef1f0ffSBarry Smith The `MATSEQAIJ` format, also called 38762ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 38770002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 38782ef1f0ffSBarry Smith either one (as in Fortran) or zero. 387917ab2063SBarry Smith 388020f4b53cSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 38812ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 388220f4b53cSBarry Smith allocation. 388317ab2063SBarry Smith 3884682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38854fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3886682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38876c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 
38886c7ebb05SLois Curfman McInnes 38891cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()` 389017ab2063SBarry Smith @*/ 3891d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 3892d71ae5a4SJacob Faibussowitsch { 38933a40ed3dSBarry Smith PetscFunctionBegin; 38949566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 38959566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 38969566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQAIJ)); 38979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz)); 38983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3899273d9f13SBarry Smith } 3900273d9f13SBarry Smith 39015d83a8b1SBarry Smith /*@ 3902273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3903273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3904273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3905273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3906273d9f13SBarry Smith 3907d083f849SBarry Smith Collective 3908273d9f13SBarry Smith 3909273d9f13SBarry Smith Input Parameters: 39101c4f3114SJed Brown + B - The matrix 3911273d9f13SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 3912273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 39130298fd71SBarry Smith (possibly different for each row) or NULL 3914273d9f13SBarry Smith 39152ef1f0ffSBarry Smith Options Database Keys: 39162ef1f0ffSBarry Smith + -mat_no_inode - Do not use inodes 39172ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 39182ef1f0ffSBarry Smith 39192ef1f0ffSBarry Smith Level: intermediate 39202ef1f0ffSBarry Smith 3921273d9f13SBarry Smith Notes: 39222ef1f0ffSBarry Smith If `nnz` is given then `nz` is ignored 392349a6f317SBarry Smith 392411a5261eSBarry Smith The `MATSEQAIJ` format also called 39252ef1f0ffSBarry Smith compressed row storage, is fully compatible with standard Fortran 3926273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3927273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3928273d9f13SBarry Smith 39292ef1f0ffSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 39302ef1f0ffSBarry Smith Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 39312ef1f0ffSBarry Smith allocation. 3932273d9f13SBarry Smith 393311a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 3934aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3935aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3936aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3937aa95bbe8SBarry Smith 393811a5261eSBarry Smith Developer Notes: 393911a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3940a96a251dSBarry Smith entries or columns indices 3941a96a251dSBarry Smith 3942273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3943273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3944273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3945273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3946273d9f13SBarry Smith 39471cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3948db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3949273d9f13SBarry Smith @*/ 3950d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3951d71ae5a4SJacob Faibussowitsch { 3952a23d5eceSKris Buschelman PetscFunctionBegin; 39536ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39546ba663aaSJed Brown PetscValidType(B, 1); 3955cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 39563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3957a23d5eceSKris Buschelman } 3958a23d5eceSKris Buschelman 3959d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3960d71ae5a4SJacob Faibussowitsch { 3961ad79cf63SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 39622576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE; 396397f1f81fSBarry Smith PetscInt i; 3964273d9f13SBarry Smith 3965273d9f13SBarry Smith PetscFunctionBegin; 3966ad79cf63SBarry Smith if (B->hash_active) { 3967aea10558SJacob Faibussowitsch B->ops[0] = 
b->cops; 3968ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3969ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3970ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3971ad79cf63SBarry Smith } 39722576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3973a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3974c461c341SBarry Smith skipallocation = PETSC_TRUE; 3975c461c341SBarry Smith nz = 0; 3976c461c341SBarry Smith } 39779566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39789566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3979899cda47SBarry Smith 3980435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 398108401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 39829f0612e4SBarry Smith if (nnz) { 3983d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 398408401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 398508401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3986b73539f3SBarry Smith } 3987b73539f3SBarry Smith } 3988b73539f3SBarry Smith 3989273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3990ab93d7beSBarry Smith if (!skipallocation) { 39914dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3992071fcb05SBarry Smith if (!b->ilen) { 3993071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39949566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3995071fcb05SBarry Smith } else { 39969566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39972ee49352SLisandro Dalcin } 3998aa624791SPierre Jolivet if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); 3999273d9f13SBarry Smith if (!nnz) { 4000435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 4001c62bd62aSJed Brown else if (nz < 0) nz = 1; 40025d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 4003d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 4004c43c4a61SBarry Smith PetscCall(PetscIntMultError(nz, B->rmap->n, &nz)); 4005273d9f13SBarry Smith } else { 4006c73702f5SBarry Smith PetscInt64 nz64 = 0; 40079371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 40089371c9d4SSatish Balay b->imax[i] = nnz[i]; 40099371c9d4SSatish Balay nz64 += nnz[i]; 40109371c9d4SSatish Balay } 40119566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 4012273d9f13SBarry Smith } 4013ab93d7beSBarry Smith 4014273d9f13SBarry Smith /* allocate the matrix space */ 40159566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 40169f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscInt), (void **)&b->j)); 40179f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(B->rmap->n + 1, sizeof(PetscInt), (void **)&b->i)); 40189f0612e4SBarry Smith b->free_ij = PETSC_TRUE; 4019396832f4SHong Zhang if (B->structure_only) { 40209f0612e4SBarry Smith b->free_a = PETSC_FALSE; 4021396832f4SHong Zhang } else { 40229f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscScalar), (void **)&b->a)); 40239f0612e4SBarry Smith b->free_a = PETSC_TRUE; 4024396832f4SHong Zhang } 4025bfeeae90SHong Zhang b->i[0] = 0; 4026ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4027c461c341SBarry Smith } else { 
4028e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4029e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4030c461c341SBarry Smith } 4031273d9f13SBarry Smith 4032846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4033846b4da1SFande Kong /* reserve user-requested sparsity */ 40349566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4035846b4da1SFande Kong } 4036846b4da1SFande Kong 4037273d9f13SBarry Smith b->nz = 0; 4038273d9f13SBarry Smith b->maxnz = nz; 4039273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40401baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4041cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4042cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40435519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40445519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 40455519a089SJose E. Roman */ 40465519a089SJose E. Roman B->nonzerostate++; 40473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4048273d9f13SBarry Smith } 4049273d9f13SBarry Smith 4050*4c51d546SAlexander PetscErrorCode MatResetPreallocation_SeqAIJ_Private(Mat A, PetscBool *memoryreset) 4051d71ae5a4SJacob Faibussowitsch { 4052846b4da1SFande Kong Mat_SeqAIJ *a; 4053a5bbaf83SFande Kong PetscInt i; 40541f14be2bSBarry Smith PetscBool skipreset; 4055846b4da1SFande Kong 4056846b4da1SFande Kong PetscFunctionBegin; 4057846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 405814d0e64fSAlex Lindsay 4059*4c51d546SAlexander PetscCheck(A->insertmode == NOT_SET_VALUES, PETSC_COMM_SELF, PETSC_ERR_SUP, "Cannot reset preallocation after setting some values but not yet calling MatAssemblyBegin()/MatAssemblyEnd()"); 4060*4c51d546SAlexander if (A->num_ass == 0) PetscFunctionReturn(PETSC_SUCCESS); 4061*4c51d546SAlexander 406214d0e64fSAlex Lindsay /* Check local size. 
If zero, then return */ 40633ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 406414d0e64fSAlex Lindsay 4065846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40662c814fdeSFande Kong /* if no saved info, we error out */ 406728b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40682c814fdeSFande Kong 40691f14be2bSBarry Smith PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and cannot reset preallocation "); 40702c814fdeSFande Kong 40711f14be2bSBarry Smith PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset)); 4072*4c51d546SAlexander if (skipreset) PetscCall(MatZeroEntries(A)); 4073*4c51d546SAlexander else { 40749566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40759566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4076846b4da1SFande Kong a->i[0] = 0; 4077ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4078846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4079846b4da1SFande Kong a->nz = 0; 4080846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4081846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4082846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4083846b4da1SFande Kong A->assembled = PETSC_FALSE; 4084b3a35320SAlex Lindsay A->nonzerostate++; 4085b3a35320SAlex Lindsay /* Log that the state of this object has changed; this will help guarantee that preconditioners get re-setup */ 4086b3a35320SAlex Lindsay PetscCall(PetscObjectStateIncrease((PetscObject)A)); 40871f14be2bSBarry Smith } 4088*4c51d546SAlexander if (memoryreset) *memoryreset = (PetscBool)!skipreset; 4089*4c51d546SAlexander PetscFunctionReturn(PETSC_SUCCESS); 4090*4c51d546SAlexander } 4091*4c51d546SAlexander 4092*4c51d546SAlexander static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4093*4c51d546SAlexander { 
4094*4c51d546SAlexander PetscFunctionBegin; 4095*4c51d546SAlexander PetscCall(MatResetPreallocation_SeqAIJ_Private(A, NULL)); 40963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4097846b4da1SFande Kong } 4098846b4da1SFande Kong 409958d36128SBarry Smith /*@ 410011a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4101a1661176SMatthew Knepley 4102a1661176SMatthew Knepley Input Parameters: 4103a1661176SMatthew Knepley + B - the matrix 4104d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero) 4105d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row 4106d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided 4107a1661176SMatthew Knepley 4108a1661176SMatthew Knepley Level: developer 4109a1661176SMatthew Knepley 41106a9b8d82SBarry Smith Notes: 41112ef1f0ffSBarry Smith The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 411258d36128SBarry Smith 41136a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 41146a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 41156a9b8d82SBarry Smith 41166a9b8d82SBarry Smith Developer Notes: 41172ef1f0ffSBarry Smith An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and 41182ef1f0ffSBarry Smith then just copies the `v` values directly with `PetscMemcpy()`. 41196a9b8d82SBarry Smith 412011a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
41216a9b8d82SBarry Smith 4122fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()` 4123a1661176SMatthew Knepley @*/ 4124d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4125d71ae5a4SJacob Faibussowitsch { 4126a1661176SMatthew Knepley PetscFunctionBegin; 41270700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41286ba663aaSJed Brown PetscValidType(B, 1); 4129cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 41303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4131a1661176SMatthew Knepley } 4132a1661176SMatthew Knepley 4133ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4134d71ae5a4SJacob Faibussowitsch { 4135a1661176SMatthew Knepley PetscInt i; 4136a1661176SMatthew Knepley PetscInt m, n; 4137a1661176SMatthew Knepley PetscInt nz; 41386a9b8d82SBarry Smith PetscInt *nnz; 4139a1661176SMatthew Knepley 4140a1661176SMatthew Knepley PetscFunctionBegin; 4141aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4142779a8d59SSatish Balay 41439566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41449566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4145779a8d59SSatish Balay 41469566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41479566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4148a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4149b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 415008401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, 
"Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4151a1661176SMatthew Knepley nnz[i] = nz; 4152a1661176SMatthew Knepley } 41539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41549566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4155a1661176SMatthew Knepley 41568e3a54c0SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES)); 4157a1661176SMatthew Knepley 41589566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41599566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4160a1661176SMatthew Knepley 41619566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 41623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4163a1661176SMatthew Knepley } 4164a1661176SMatthew Knepley 4165ad7e164aSPierre Jolivet /*@ 41662ef1f0ffSBarry Smith MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`. 4167ad7e164aSPierre Jolivet 4168ad7e164aSPierre Jolivet Input Parameters: 4169ad7e164aSPierre Jolivet + A - left-hand side matrix 4170ad7e164aSPierre Jolivet . B - right-hand side matrix 417111a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4172ad7e164aSPierre Jolivet 4173ad7e164aSPierre Jolivet Output Parameter: 41742ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B` 4175ad7e164aSPierre Jolivet 4176ad7e164aSPierre Jolivet Level: intermediate 4177ad7e164aSPierre Jolivet 417811a5261eSBarry Smith Note: 417911a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4180ad7e164aSPierre Jolivet 41811cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4182ad7e164aSPierre Jolivet @*/ 4183d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4184d71ae5a4SJacob Faibussowitsch { 4185ad7e164aSPierre Jolivet PetscFunctionBegin; 4186ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4187ad7e164aSPierre Jolivet PetscValidType(A, 1); 4188ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4189ad7e164aSPierre Jolivet PetscValidType(B, 2); 41904f572ea9SToby Isaac PetscAssertPointer(C, 4); 4191ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4192ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4193ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4194ad7e164aSPierre Jolivet } 4195cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 41963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4197ad7e164aSPierre Jolivet } 4198ad7e164aSPierre Jolivet 4199ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4200d71ae5a4SJacob Faibussowitsch { 4201ad7e164aSPierre Jolivet Mat newmat; 4202ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4203ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4204ad7e164aSPierre Jolivet PetscScalar *v; 4205fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4206ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4207ad7e164aSPierre Jolivet PetscBool flg; 4208ad7e164aSPierre Jolivet 4209ad7e164aSPierre Jolivet PetscFunctionBegin; 421028b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 421128b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 421228b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 421328b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 42149566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 421528b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4216aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4217ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42189566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 42199566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 42209566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 42219566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4222ad7e164aSPierre Jolivet i[0] = 0; 4223ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4224ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4225ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4226ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4227ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4228ad7e164aSPierre Jolivet } 4229ad7e164aSPierre Jolivet } 4230ad7e164aSPierre Jolivet } 42319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4232ad7e164aSPierre Jolivet *C = newmat; 42339566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4234ad7e164aSPierre Jolivet nnz = 0; 4235ad7e164aSPierre Jolivet } 42369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 
42379566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4239ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4240ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4241ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4242ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4243ad7e164aSPierre Jolivet } 4244ad7e164aSPierre Jolivet } 4245ad7e164aSPierre Jolivet } 42469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 42493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4250ad7e164aSPierre Jolivet } 4251ad7e164aSPierre Jolivet 4252c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4253af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4254170fe5c8SBarry Smith 4255170fe5c8SBarry Smith /* 4256170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4257170fe5c8SBarry Smith 4258170fe5c8SBarry Smith n p p 42592da392ccSBarry Smith [ ] [ ] [ ] 42602da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42612da392ccSBarry Smith [ ] [ ] [ ] 4262170fe5c8SBarry Smith 4263170fe5c8SBarry Smith */ 4264d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4265d71ae5a4SJacob Faibussowitsch { 4266170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4267170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4268170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 426986214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4270170fe5c8SBarry Smith const PetscInt *ii, *idx; 4271170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4272170fe5c8SBarry Smith PetscScalar *c, *c_q; 427386214ceeSStefano Zampini PetscInt clda 
= sub_c->lda; 427486214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4275170fe5c8SBarry Smith 4276170fe5c8SBarry Smith PetscFunctionBegin; 4277d0f46423SBarry Smith m = A->rmap->n; 4278d0f46423SBarry Smith n = A->cmap->n; 4279d0f46423SBarry Smith p = B->cmap->n; 4280170fe5c8SBarry Smith a = sub_a->v; 4281170fe5c8SBarry Smith b = sub_b->a; 4282170fe5c8SBarry Smith c = sub_c->v; 428386214ceeSStefano Zampini if (clda == m) { 42849566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 428586214ceeSStefano Zampini } else { 428686214ceeSStefano Zampini for (j = 0; j < p; j++) 42879371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 428886214ceeSStefano Zampini } 4289170fe5c8SBarry Smith ii = sub_b->i; 4290170fe5c8SBarry Smith idx = sub_b->j; 4291170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4292170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4293170fe5c8SBarry Smith while (q-- > 0) { 429486214ceeSStefano Zampini c_q = c + clda * (*idx); 429586214ceeSStefano Zampini a_q = a + alda * i; 4296854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4297170fe5c8SBarry Smith idx++; 4298170fe5c8SBarry Smith b++; 4299170fe5c8SBarry Smith } 4300170fe5c8SBarry Smith } 43013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4302170fe5c8SBarry Smith } 4303170fe5c8SBarry Smith 4304d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4305d71ae5a4SJacob Faibussowitsch { 4306d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 430786214ceeSStefano Zampini PetscBool cisdense; 4308170fe5c8SBarry Smith 4309170fe5c8SBarry Smith PetscFunctionBegin; 431008401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 43119566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 43129566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 
4313d5e393b6SSuyash Tandon PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 431448a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 43159566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4316d73949e8SHong Zhang 43174222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 43183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4319170fe5c8SBarry Smith } 4320170fe5c8SBarry Smith 43210bad9183SKris Buschelman /*MC 4322fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43230bad9183SKris Buschelman based on compressed sparse row format. 43240bad9183SKris Buschelman 43252ef1f0ffSBarry Smith Options Database Key: 43260bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43270bad9183SKris Buschelman 43280bad9183SKris Buschelman Level: beginner 43290bad9183SKris Buschelman 43300cd7f59aSBarry Smith Notes: 43312ef1f0ffSBarry Smith `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values, 43320cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43330cd7f59aSBarry Smith in the matrix 43340cd7f59aSBarry Smith 433511a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored

   Developer Note:
    It would be nice if all matrix formats supported passing `NULL` in for the numerical values

.seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
   and `MATMPIAIJ` otherwise. As a result, for single process communicators,
   `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes. It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Key:
. -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`

   Level: beginner

   Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`; this type also automatically switches over to use inodes when
   enough exist.

.seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.

   Options Database Key:
. -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()`

   Level: beginner

   Note:
   This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator,
   and `MATMPIAIJCRL` otherwise. As a result, for single process communicators,
   `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes. It is recommended that you call both of
   the above preallocation routines for simplicity.

.seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL()`, `MATSEQAIJCRL`, `MATMPIAIJCRL`
M*/

/* Prototypes of conversion and product routines that are defined in other source files; the optional ones are guarded by the corresponding PETSC_HAVE_ macro */
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *);
#if defined(PETSC_HAVE_ELEMENTAL)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_SCALAPACK)
PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_HYPRE)
PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *);
#endif

PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *);
PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *);
PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);

/*@C
  MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored

  Not Collective

  Input Parameter:
. A - a `MATSEQAIJ` matrix

  Output Parameter:
.
array - pointer to the data 44088c778c55SBarry Smith 44098c778c55SBarry Smith Level: intermediate 44108c778c55SBarry Smith 4411fe59aa6dSJacob Faibussowitsch Fortran Notes: 44120ab4885dSBarry Smith `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()` 44130ab4885dSBarry Smith 44141cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 44158c778c55SBarry Smith @*/ 44165d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[]) 4417d71ae5a4SJacob Faibussowitsch { 4418d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44198c778c55SBarry Smith 44208c778c55SBarry Smith PetscFunctionBegin; 4421d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44229566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4423d67d9f35SJunchao Zhang } else { 4424d67d9f35SJunchao Zhang *array = aij->a; 4425d67d9f35SJunchao Zhang } 44263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4427d67d9f35SJunchao Zhang } 4428d67d9f35SJunchao Zhang 4429d67d9f35SJunchao Zhang /*@C 443011a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4431d67d9f35SJunchao Zhang 4432d67d9f35SJunchao Zhang Not Collective 4433d67d9f35SJunchao Zhang 4434d67d9f35SJunchao Zhang Input Parameters: 4435fe59aa6dSJacob Faibussowitsch + A - a `MATSEQAIJ` matrix 4436d67d9f35SJunchao Zhang - array - pointer to the data 4437d67d9f35SJunchao Zhang 4438d67d9f35SJunchao Zhang Level: intermediate 4439d67d9f35SJunchao Zhang 4440fe59aa6dSJacob Faibussowitsch Fortran Notes: 44410ab4885dSBarry Smith `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()` 44420ab4885dSBarry Smith 44431cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4444d67d9f35SJunchao Zhang @*/ 
44455d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[]) 4446d71ae5a4SJacob Faibussowitsch { 4447d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4448d67d9f35SJunchao Zhang 4449d67d9f35SJunchao Zhang PetscFunctionBegin; 4450d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44519566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4452d67d9f35SJunchao Zhang } else { 4453d67d9f35SJunchao Zhang *array = NULL; 4454d67d9f35SJunchao Zhang } 44559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44569566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44588c778c55SBarry Smith } 44598c778c55SBarry Smith 446021e72a00SBarry Smith /*@C 446111a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44628f1ea47aSStefano Zampini 44630ab4885dSBarry Smith Not Collective; No Fortran Support 44648f1ea47aSStefano Zampini 44658f1ea47aSStefano Zampini Input Parameter: 4466fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44678f1ea47aSStefano Zampini 44688f1ea47aSStefano Zampini Output Parameter: 44698f1ea47aSStefano Zampini . 
array - pointer to the data 44708f1ea47aSStefano Zampini 44718f1ea47aSStefano Zampini Level: intermediate 44728f1ea47aSStefano Zampini 44731cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44748f1ea47aSStefano Zampini @*/ 44755d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[]) 4476d71ae5a4SJacob Faibussowitsch { 4477d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44788f1ea47aSStefano Zampini 44798f1ea47aSStefano Zampini PetscFunctionBegin; 4480d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44819566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4482d67d9f35SJunchao Zhang } else { 4483d67d9f35SJunchao Zhang *array = aij->a; 4484d67d9f35SJunchao Zhang } 44853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44868f1ea47aSStefano Zampini } 44878f1ea47aSStefano Zampini 44888f1ea47aSStefano Zampini /*@C 448911a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44908f1ea47aSStefano Zampini 44910ab4885dSBarry Smith Not Collective; No Fortran Support 44928f1ea47aSStefano Zampini 44938f1ea47aSStefano Zampini Input Parameter: 4494fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44958f1ea47aSStefano Zampini 44968f1ea47aSStefano Zampini Output Parameter: 44978f1ea47aSStefano Zampini . 
array - pointer to the data 44988f1ea47aSStefano Zampini 44998f1ea47aSStefano Zampini Level: intermediate 45008f1ea47aSStefano Zampini 45011cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45028f1ea47aSStefano Zampini @*/ 45035d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[]) 4504d71ae5a4SJacob Faibussowitsch { 4505d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 45068f1ea47aSStefano Zampini 45078f1ea47aSStefano Zampini PetscFunctionBegin; 4508d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 45099566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4510d67d9f35SJunchao Zhang } else { 4511d67d9f35SJunchao Zhang *array = NULL; 4512d67d9f35SJunchao Zhang } 45133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4514d67d9f35SJunchao Zhang } 4515d67d9f35SJunchao Zhang 4516d67d9f35SJunchao Zhang /*@C 451711a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4518d67d9f35SJunchao Zhang 45190ab4885dSBarry Smith Not Collective; No Fortran Support 4520d67d9f35SJunchao Zhang 4521d67d9f35SJunchao Zhang Input Parameter: 4522fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 4523d67d9f35SJunchao Zhang 4524d67d9f35SJunchao Zhang Output Parameter: 4525d67d9f35SJunchao Zhang . 
array - pointer to the data 4526d67d9f35SJunchao Zhang 4527d67d9f35SJunchao Zhang Level: intermediate 4528d67d9f35SJunchao Zhang 45291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4530d67d9f35SJunchao Zhang @*/ 45315d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[]) 4532d71ae5a4SJacob Faibussowitsch { 4533d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4534d67d9f35SJunchao Zhang 4535d67d9f35SJunchao Zhang PetscFunctionBegin; 4536d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45379566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4538d67d9f35SJunchao Zhang } else { 4539d67d9f35SJunchao Zhang *array = aij->a; 4540d67d9f35SJunchao Zhang } 45419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45429566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 45433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4544d67d9f35SJunchao Zhang } 4545d67d9f35SJunchao Zhang 4546d67d9f35SJunchao Zhang /*@C 4547d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4548d67d9f35SJunchao Zhang 45490ab4885dSBarry Smith Not Collective; No Fortran Support 4550d67d9f35SJunchao Zhang 4551d67d9f35SJunchao Zhang Input Parameter: 4552fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix 4553d67d9f35SJunchao Zhang 4554d67d9f35SJunchao Zhang Output Parameter: 4555d67d9f35SJunchao Zhang . 
array - pointer to the data 4556d67d9f35SJunchao Zhang 4557d67d9f35SJunchao Zhang Level: intermediate 4558d67d9f35SJunchao Zhang 45591cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4560d67d9f35SJunchao Zhang @*/ 45615d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[]) 4562d71ae5a4SJacob Faibussowitsch { 4563d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4564d67d9f35SJunchao Zhang 4565d67d9f35SJunchao Zhang PetscFunctionBegin; 4566d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45679566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4568d67d9f35SJunchao Zhang } else { 4569d67d9f35SJunchao Zhang *array = NULL; 4570d67d9f35SJunchao Zhang } 45713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45728f1ea47aSStefano Zampini } 45738f1ea47aSStefano Zampini 45748f1ea47aSStefano Zampini /*@C 457511a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45767ee59b9bSJunchao Zhang 45770ab4885dSBarry Smith Not Collective; No Fortran Support 45787ee59b9bSJunchao Zhang 45797ee59b9bSJunchao Zhang Input Parameter: 458011a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45817ee59b9bSJunchao Zhang 45827ee59b9bSJunchao Zhang Output Parameters: 45837ee59b9bSJunchao Zhang + i - row map array of the matrix 45847ee59b9bSJunchao Zhang . j - column index array of the matrix 45857ee59b9bSJunchao Zhang . a - data array of the matrix 4586fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays 45877ee59b9bSJunchao Zhang 4588fe59aa6dSJacob Faibussowitsch Level: developer 45892ef1f0ffSBarry Smith 45907ee59b9bSJunchao Zhang Notes: 45912ef1f0ffSBarry Smith Any of the output parameters can be `NULL`, in which case the corresponding value is not returned. 45927ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. 
Otherwise, they are on the host. 45937ee59b9bSJunchao Zhang 45947ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45952ef1f0ffSBarry Smith If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix. 45967ee59b9bSJunchao Zhang 45971cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45987ee59b9bSJunchao Zhang @*/ 45995d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype) 4600d71ae5a4SJacob Faibussowitsch { 46017ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 46027ee59b9bSJunchao Zhang 46037ee59b9bSJunchao Zhang PetscFunctionBegin; 46047ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 46057ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 46067ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 46077ee59b9bSJunchao Zhang } else { 46087ee59b9bSJunchao Zhang if (i) *i = aij->i; 46097ee59b9bSJunchao Zhang if (j) *j = aij->j; 46107ee59b9bSJunchao Zhang if (a) *a = aij->a; 46117ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 46127ee59b9bSJunchao Zhang } 46133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 46147ee59b9bSJunchao Zhang } 46157ee59b9bSJunchao Zhang 4616cc4c1da9SBarry Smith /*@ 461721e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 461821e72a00SBarry Smith 461921e72a00SBarry Smith Not Collective 462021e72a00SBarry Smith 462121e72a00SBarry Smith Input Parameter: 4622fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 462321e72a00SBarry Smith 462421e72a00SBarry Smith Output Parameter: 462521e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row

  Level: intermediate

.seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
@*/
PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;

  PetscFunctionBegin;
  *nz = aij->rmax; /* simply reports the rmax field of the Mat_SeqAIJ struct */
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
  Destroy callback for the MatCOOStruct_SeqAIJ attached to a matrix by MatSetPreallocationCOO_SeqAIJ():
  frees the perm[] and jmap[] arrays and then the struct itself.
*/
static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void *data)
{
  MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)data;

  PetscFunctionBegin;
  PetscCall(PetscFree(coo->perm));
  PetscCall(PetscFree(coo->jmap));
  PetscCall(PetscFree(coo));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
  Build the CSR structure of a SeqAIJ matrix from coo_n COO (row, column) index pairs.

  Input Parameters:
    mat   - the matrix to set up
    coo_n - number of COO entries
    coo_i - row indices; MODIFIED in place (entries whose column is negative get row -1, and the array may be sorted)
    coo_j - column indices; MODIFIED in place (may be sorted, and relabeled in the hypre special case below)

  What it does:
    - entries with a negative row or column index are ignored;
    - repeated (row, column) pairs are merged into one nonzero;
    - Ai/Aj/Aa (values zeroed) are allocated and handed to the matrix via MatSetSeqAIJWithArrays_private();
    - a MatCOOStruct_SeqAIJ holding perm[] (sorted position -> original COO position) and jmap[] (CSR-like offsets
      into perm[] for each unique nonzero) is attached to the matrix under "__PETSc_MatCOOStruct_Host" for later
      use by MatSetValuesCOO_SeqAIJ().
*/
PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
{
  MPI_Comm             comm;
  PetscInt            *i, *j;
  PetscInt             M, N, row, iprev;
  PetscCount           k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */
  PetscInt            *Ai;                             /* Change to PetscCount once we use it for row pointers */
  PetscInt            *Aj;
  PetscScalar         *Aa;
  Mat_SeqAIJ          *seqaij = (Mat_SeqAIJ *)mat->data;
  MatType              rtype;
  PetscCount          *perm, *jmap;
  MatCOOStruct_SeqAIJ *coo;
  PetscBool            isorted;
  PetscBool            hypre;
  const char          *name;

  PetscFunctionBegin;
  PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
  PetscCall(MatGetSize(mat, &M, &N));
  i = coo_i;
  j = coo_j;
  PetscCall(PetscMalloc1(coo_n, &perm));

  /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AIJ_HYPRE results in this case) */
  isorted = PETSC_TRUE;
  iprev   = PETSC_INT_MIN;
  for (k = 0; k < coo_n; k++) {
    if (j[k] < 0) i[k] = -1; /* a negative column marks the whole entry as ignored by giving it a negative row */
    if (isorted) {
      if (i[k] < iprev) isorted = PETSC_FALSE;
      else iprev = i[k];
    }
    perm[k] = k; /* identity permutation; permuted together with i[]/j[] by the sorts below */
  }

  /* Sort by row if not already */
  if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm));

  /* Advance k to the first row with a non-negative index */
  for (k = 0; k < coo_n; k++)
    if (i[k] >= 0) break;
  nneg = k;                                         /* number of leading (ignored) entries with negative row index */
  PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
  nnz = 0;                                          /* Total number of unique nonzeros to be counted */
  jmap++;                                           /* Inc jmap by 1 for convenience */

  PetscCall(PetscShmgetAllocateArray(M + 1, sizeof(PetscInt), (void **)&Ai)); /* CSR of A */
  PetscCall(PetscArrayzero(Ai, M + 1));
  PetscCall(PetscShmgetAllocateArray(coo_n - nneg, sizeof(PetscInt), (void **)&Aj)); /* We have at most coo_n-nneg unique nonzeros */

  /* The hypre special case below is keyed off the object name of the matrix */
  PetscCall(PetscObjectGetName((PetscObject)mat, &name));
  PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre));

  /* In each row, sort by column, then unique column indices to get row length */
  Ai++;  /* Inc by 1 for convenience */
  q = 0; /* q-th unique nonzero, with q starting from 0 */
  while (k < coo_n) {
    PetscBool strictly_sorted; // this row is strictly sorted?
    PetscInt  jprev;

    /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */
    row             = i[k];
    start           = k;
    jprev           = PETSC_INT_MIN;
    strictly_sorted = PETSC_TRUE;
    while (k < coo_n && i[k] == row) {
      if (strictly_sorted) {
        if (j[k] <= jprev) strictly_sorted = PETSC_FALSE;
        else jprev = j[k];
      }
      k++;
    }
    end = k;

    /* hack for HYPRE: swap min column to diag so that diagonal values will go first */
    if (hypre) {
      PetscInt  minj    = PETSC_INT_MAX;
      PetscBool hasdiag = PETSC_FALSE;

      if (strictly_sorted) { // fast path to swap the first and the diag
        PetscCount tmp;
        for (p = start; p < end; p++) {
          if (j[p] == row && p != start) {
            j[p]        = j[start];
            j[start]    = row;
            tmp         = perm[start];
            perm[start] = perm[p];
            perm[p]     = tmp;
            break;
          }
        }
      } else {
        for (p = start; p < end; p++) {
          hasdiag = (PetscBool)(hasdiag || (j[p] == row));
          minj    = PetscMin(minj, j[p]);
        }

        if (hasdiag) {
          /* exchange the labels `minj` and `row` so that the diagonal entries sort first in the row */
          for (p = start; p < end; p++) {
            if (j[p] == minj) j[p] = row;
            else if (j[p] == row) j[p] = minj;
          }
        }
      }
    }
    // sort by columns in a row
    if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start));

    if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q
      for (p = start; p < end; p++, q++) {
        Aj[q]   = j[p];
        jmap[q] = 1;
      }
      PetscCall(PetscIntCast(end - start, Ai + row));
      nnz += Ai[row]; // q is already advanced
    } else {
      /* Find number of unique col entries in this row */
      Aj[q]   = j[start]; /* Log the first nonzero in this row */
      jmap[q] = 1;        /* Number of repeats of this nonzero entry */
      Ai[row] = 1;
      nnz++;

      for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */
        if (j[p] != j[p - 1]) {           /* Meet a new nonzero */
          q++;
          jmap[q] = 1;
          Aj[q]   = j[p];
          Ai[row]++;
          nnz++;
        } else {
          jmap[q]++;
        }
      }
      q++; /* Move to next row and thus next unique nonzero */
    }
  }

  Ai--; /* Back to the beginning of Ai[] */
  for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; /* row lengths -> row offsets (prefix sum) */
  jmap--; // Back to the beginning of jmap[]
  jmap[0] = 0;
  for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; /* repeat counts -> offsets into perm[] (prefix sum) */

  if (nnz < coo_n - nneg) { /* Reallocate with actual number of unique nonzeros */
    PetscCount *jmap_new;
    PetscInt   *Aj_new;

    PetscCall(PetscMalloc1(nnz + 1, &jmap_new));
    PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1));
    PetscCall(PetscFree(jmap));
    jmap = jmap_new;

    PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscInt), (void **)&Aj_new));
    PetscCall(PetscArraycpy(Aj_new, Aj, nnz));
    PetscCall(PetscShmgetDeallocateArray((void **)&Aj));
    Aj = Aj_new;
  }

  if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
    PetscCount *perm_new;

    PetscCall(PetscMalloc1(coo_n - nneg, &perm_new));
    PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg));
    PetscCall(PetscFree(perm));
    perm = perm_new;
  }

  PetscCall(MatGetRootType_Private(mat, &rtype));
  PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscScalar), (void **)&Aa));
  PetscCall(PetscArrayzero(Aa, nnz));
  PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat));

  seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */

  // Put the COO struct in a container and then attach that to the matrix
  PetscCall(PetscMalloc1(1, &coo));
  PetscCall(PetscIntCast(nnz, &coo->nz));
  coo->n    = coo_n;
  coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again
  coo->jmap = jmap;         // of length nnz+1
  coo->perm = perm;
  PetscCall(PetscObjectContainerCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", coo, MatCOOStructDestroy_SeqAIJ));
  PetscFunctionReturn(PETSC_SUCCESS);
}

static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode)
{
  Mat_SeqAIJ          *aseq = (Mat_SeqAIJ *)A->data;
  PetscCount           i, j, Annz = aseq->nz;
  PetscCount          *perm, *jmap;
  PetscScalar         *Aa;
  PetscContainer       container;
  MatCOOStruct_SeqAIJ *coo;

  PetscFunctionBegin;
  PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container));
  PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix");
  PetscCall(PetscContainerGetPointer(container, (void **)&coo));
  perm = coo->perm;
  jmap = coo->jmap;
  PetscCall(MatSeqAIJGetArray(A, &Aa));
  /* For the i-th stored nonzero, add up all entries of v[] mapped to it through perm[jmap[i] .. jmap[i+1]-1].
     With INSERT_VALUES the previous value is discarded; otherwise the sum is accumulated onto it. */
  for (i = 0; i < Annz; i++) {
    PetscScalar sum = 0.0;
    for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]];
    Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum;
  }
  PetscCall(MatSeqAIJRestoreArray(A, &Aa));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/* Prototypes of conversion routines that are registered in MatCreate_SeqAIJ() only when the matching backend is configured */
#if defined(PETSC_HAVE_CUDA)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_HIP)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *);
#endif

/*
  Constructor for the MATSEQAIJ type.

  Errors out unless the communicator of B has size 1, allocates the Mat_SeqAIJ data structure, installs the
  operations table, sets the fields to their defaults, and composes the type-specific functions
  (conversions, preallocation, products, COO assembly, ...) on B.
*/
PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
{
  Mat_SeqAIJ *b;
  PetscMPIInt size;

  PetscFunctionBegin;
  PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
  PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");

  PetscCall(PetscNew(&b));

  B->data   = (void *)b;
  B->ops[0] = MatOps_Values; /* copy the whole operations table in one struct assignment */
  if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;

  b->row                = NULL;
  b->col                = NULL;
  b->icol               = NULL;
  b->reallocs           = 0;
  b->ignorezeroentries  = PETSC_FALSE;
  b->roworiented        = PETSC_TRUE;
  b->nonew              = 0;
  b->diag               = NULL;
  b->solve_work         = NULL;
  B->spptr              = NULL;
  b->saved_values       = NULL;
  b->idiag              = NULL;
  b->mdiag              = NULL;
  b->ssor_work          = NULL;
  b->omega              = 1.0;
  b->fshift             = 0.0;
  b->idiagvalid         = PETSC_FALSE;
  b->ibdiagvalid        = PETSC_FALSE;
  b->keepnonzeropattern = PETSC_FALSE;

  PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
#if defined(PETSC_HAVE_MATLAB)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
#endif
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
#if defined(PETSC_HAVE_MKL_SPARSE)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
#endif
#if defined(PETSC_HAVE_CUDA)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
#endif
#if defined(PETSC_HAVE_HIP)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ));
#endif
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
#endif
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
#if defined(PETSC_HAVE_ELEMENTAL)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
#endif
#if defined(PETSC_HAVE_SCALAPACK)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
#endif
#if defined(PETSC_HAVE_HYPRE)
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
#endif
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
  PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
  PetscCall(MatCreate_SeqAIJ_Inode(B));
  /* NOTE(review): the type name was already set to MATSEQAIJ above; this second call looks redundant unless
     MatCreate_SeqAIJ_Inode() alters the name - confirm before removing */
  PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
  PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
    Given a matrix generated with MatGetFactor() duplicates all the information in A into C
*/
PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace)
{
  Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data;
  PetscInt    m = A->rmap->n, i;

  PetscFunctionBegin;
  PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix");

  C->factortype    = A->factortype;
  c->row           = NULL;
  c->col           = NULL;
  c->icol          = NULL;
  c->reallocs      = 0;
  c->diagonaldense = a->diagonaldense;

  C->assembled = A->assembled;

  if (A->preallocated) {
    PetscCall(PetscLayoutReference(A->rmap, &C->rmap));
    PetscCall(PetscLayoutReference(A->cmap, &C->cmap));

    if (!A->hash_active) {
      PetscCall(PetscMalloc1(m, &c->imax));
      PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt)));
      PetscCall(PetscMalloc1(m, &c->ilen));
      PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt)));

      /* allocate the matrix space */
4998f77e22a1SHong Zhang if (mallocmatspace) { 49999f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscScalar), (void **)&c->a)); 50009f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscInt), (void **)&c->j)); 50019f0612e4SBarry Smith PetscCall(PetscShmgetAllocateArray(m + 1, sizeof(PetscInt), (void **)&c->i)); 50029566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 50039f0612e4SBarry Smith c->free_a = PETSC_TRUE; 50049f0612e4SBarry Smith c->free_ij = PETSC_TRUE; 500517ab2063SBarry Smith if (m > 0) { 50069566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 5007be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 50082e5835c6SStefano Zampini const PetscScalar *aa; 50092e5835c6SStefano Zampini 50109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 50119566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 50129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 5013be6bf707SBarry Smith } else { 50149566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 501517ab2063SBarry Smith } 501608480c60SBarry Smith } 5017f77e22a1SHong Zhang } 501831fe6a7dSBarry Smith C->preallocated = PETSC_TRUE; 501931fe6a7dSBarry Smith } else { 502031fe6a7dSBarry Smith PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix"); 502131fe6a7dSBarry Smith PetscCall(MatSetUp(C)); 502231fe6a7dSBarry Smith } 502317ab2063SBarry Smith 50246ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 5025416022c9SBarry Smith c->roworiented = a->roworiented; 5026416022c9SBarry Smith c->nonew = a->nonew; 5027416022c9SBarry Smith if (a->diag) { 50289566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 50299566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 5030071fcb05SBarry Smith } 
else c->diag = NULL; 50312205254eSKarl Rupp 5032f4259b30SLisandro Dalcin c->solve_work = NULL; 5033f4259b30SLisandro Dalcin c->saved_values = NULL; 5034f4259b30SLisandro Dalcin c->idiag = NULL; 5035f4259b30SLisandro Dalcin c->ssor_work = NULL; 5036a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 50376ad4291fSHong Zhang 5038893ad86cSHong Zhang c->rmax = a->rmax; 5039416022c9SBarry Smith c->nz = a->nz; 50408ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 5041754ec7b1SSatish Balay 50426ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 50436ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 5044cd6b891eSBarry Smith if (a->compressedrow.use) { 50456ad4291fSHong Zhang i = a->compressedrow.nrows; 50469566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 50479566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 50489566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 504927ea64f8SHong Zhang } else { 505027ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 50510298fd71SBarry Smith c->compressedrow.i = NULL; 50520298fd71SBarry Smith c->compressedrow.rindex = NULL; 50536ad4291fSHong Zhang } 5054ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 5055e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 50564846f1f5SKris Buschelman 50579566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 505869272f91SPierre Jolivet } 50599566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 50603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 506117ab2063SBarry Smith } 506217ab2063SBarry Smith 5063d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 
5064d71ae5a4SJacob Faibussowitsch { 5065b24902e0SBarry Smith PetscFunctionBegin; 50669566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 50679566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 506848a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 50699566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 50709566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 50713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5072b24902e0SBarry Smith } 5073b24902e0SBarry Smith 5074d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 5075d71ae5a4SJacob Faibussowitsch { 507652f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 507752f91c60SVaclav Hapla 507852f91c60SVaclav Hapla PetscFunctionBegin; 507952f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 508052f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 5081c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 50829566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 50839566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 50849566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 508552f91c60SVaclav Hapla if (isbinary) { 50869566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 508752f91c60SVaclav Hapla } else if (ishdf5) { 508852f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 50899566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 509052f91c60SVaclav Hapla #else 509152f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not 
supported in this build.\nPlease reconfigure using --download-hdf5"); 509252f91c60SVaclav Hapla #endif 509352f91c60SVaclav Hapla } else { 509498921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 509552f91c60SVaclav Hapla } 50963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 509752f91c60SVaclav Hapla } 509852f91c60SVaclav Hapla 5099d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 5100d71ae5a4SJacob Faibussowitsch { 51013ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 51023ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 5103fbdbba38SShri Abhyankar 5104fbdbba38SShri Abhyankar PetscFunctionBegin; 51059566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5106bbead8a2SBarry Smith 51073ea6fe3dSLisandro Dalcin /* read in matrix header */ 51089566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 510908401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 51109371c9d4SSatish Balay M = header[1]; 51119371c9d4SSatish Balay N = header[2]; 51129371c9d4SSatish Balay nz = header[3]; 511308401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 511408401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 511508401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 5116fbdbba38SShri Abhyankar 51173ea6fe3dSLisandro Dalcin /* set block sizes 
from the viewer's .info file */ 51189566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 51193ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 51203ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 51213ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 51223ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 51233ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 51249566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 51259566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 51263ea6fe3dSLisandro Dalcin 51273ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 51289566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5129aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51303ea6fe3dSLisandro Dalcin 5131fbdbba38SShri Abhyankar /* read in row lengths */ 51329566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 51339566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 51343ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 51359371c9d4SSatish Balay sum = 0; 51369371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 513708401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 51383ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 51399566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 51409566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5141aed4548fSBarry Smith PetscCheck(M == rows && N == cols, 
PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 51423ea6fe3dSLisandro Dalcin /* store row lengths */ 51439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 51449566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5145fbdbba38SShri Abhyankar 51463ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 51479371c9d4SSatish Balay a->i[0] = 0; 51489371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 51493ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 51509566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 51513ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 51529566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5153fbdbba38SShri Abhyankar 51549566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 51559566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 51563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5157fbdbba38SShri Abhyankar } 5158fbdbba38SShri Abhyankar 5159d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5160d71ae5a4SJacob Faibussowitsch { 51617264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5162fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5163eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5164eeffb40dSHong Zhang PetscInt k; 5165eeffb40dSHong Zhang #endif 51667264ac53SSatish Balay 51673a40ed3dSBarry Smith PetscFunctionBegin; 5168bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5169d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5170ca44d042SBarry Smith *flg = PETSC_FALSE; 
51713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5172bcd2baecSBarry Smith } 51737264ac53SSatish Balay 51747264ac53SSatish Balay /* if the a->i are the same */ 51759566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 51763ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 51777264ac53SSatish Balay 51787264ac53SSatish Balay /* if a->j are the same */ 51799566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 51803ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 5181bcd2baecSBarry Smith 51829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 51839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5184bcd2baecSBarry Smith /* if a->a are the same */ 5185eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5186eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5187fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5188eeffb40dSHong Zhang *flg = PETSC_FALSE; 51893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5190eeffb40dSHong Zhang } 5191eeffb40dSHong Zhang } 5192eeffb40dSHong Zhang #else 51939566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5194eeffb40dSHong Zhang #endif 51959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 51969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 51973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51987264ac53SSatish Balay } 519936db0b34SBarry Smith 520005869f15SSatish Balay /*@ 520111a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 520236db0b34SBarry Smith provided by the user. 
520336db0b34SBarry Smith 5204d083f849SBarry Smith Collective 520536db0b34SBarry Smith 520636db0b34SBarry Smith Input Parameters: 520736db0b34SBarry Smith + comm - must be an MPI communicator of size 1 520836db0b34SBarry Smith . m - number of rows 520936db0b34SBarry Smith . n - number of columns 5210483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 521136db0b34SBarry Smith . j - column indices 521236db0b34SBarry Smith - a - matrix values 521336db0b34SBarry Smith 521436db0b34SBarry Smith Output Parameter: 521536db0b34SBarry Smith . mat - the matrix 521636db0b34SBarry Smith 521736db0b34SBarry Smith Level: intermediate 521836db0b34SBarry Smith 521936db0b34SBarry Smith Notes: 52202ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 5221292fb18eSBarry Smith once the matrix is destroyed and not before 522236db0b34SBarry Smith 522336db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 522436db0b34SBarry Smith 52252ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 522636db0b34SBarry Smith 5227a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5228a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 52298eef79e4SBarry Smith as shown 52302ef1f0ffSBarry Smith .vb 52312ef1f0ffSBarry Smith 1 0 0 52322ef1f0ffSBarry Smith 2 0 3 52332ef1f0ffSBarry Smith 4 5 6 5234a4552177SSatish Balay 52352ef1f0ffSBarry Smith i = {0,1,3,6} [size = nrow+1 = 3+1] 52362ef1f0ffSBarry Smith j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 52372ef1f0ffSBarry Smith v = {1,2,3,4,5,6} [size = 6] 52382ef1f0ffSBarry Smith .ve 5239a4552177SSatish Balay 52401cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 524136db0b34SBarry Smith @*/ 5242d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5243d71ae5a4SJacob Faibussowitsch { 5244cbcfb4deSHong Zhang PetscInt ii; 524536db0b34SBarry Smith Mat_SeqAIJ *aij; 5246cbcfb4deSHong Zhang PetscInt jj; 524736db0b34SBarry Smith 524836db0b34SBarry Smith PetscFunctionBegin; 5249aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 52509566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52519566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52529566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 52539566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5255ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 52569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 52579566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5258ab93d7beSBarry Smith 525936db0b34SBarry Smith aij->i = i; 526036db0b34SBarry Smith aij->j = j; 526136db0b34SBarry Smith aij->a = a; 
526236db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5263e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5264e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 526536db0b34SBarry Smith 5266cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 526736db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 526876bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5269aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 52709985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 527108401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 527208401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii); 52739985e31cSBarry Smith } 527436db0b34SBarry Smith } 527576bd3646SJed Brown } 527676bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 527736db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 527808401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5279da0802e2SStefano Zampini PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1); 528036db0b34SBarry Smith } 528176bd3646SJed Brown } 528236db0b34SBarry Smith 52839566063dSJacob 
Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52849566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 528636db0b34SBarry Smith } 5287cbc6b225SStefano Zampini 5288f62e3866SBarry Smith /*@ 528911a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 52908a0b0e6bSVictor Minden provided by the user. 52918a0b0e6bSVictor Minden 5292d083f849SBarry Smith Collective 52938a0b0e6bSVictor Minden 52948a0b0e6bSVictor Minden Input Parameters: 52958a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 52968a0b0e6bSVictor Minden . m - number of rows 52978a0b0e6bSVictor Minden . n - number of columns 52988a0b0e6bSVictor Minden . i - row indices 52998a0b0e6bSVictor Minden . j - column indices 53001230e6d1SVictor Minden . a - matrix values 53011230e6d1SVictor Minden . nz - number of nonzeros 53022ef1f0ffSBarry Smith - idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 53038a0b0e6bSVictor Minden 53048a0b0e6bSVictor Minden Output Parameter: 53058a0b0e6bSVictor Minden . 
mat - the matrix 53068a0b0e6bSVictor Minden 53078a0b0e6bSVictor Minden Level: intermediate 53088a0b0e6bSVictor Minden 5309f62e3866SBarry Smith Example: 5310f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 53119e99939fSJunchao Zhang .vb 53128a0b0e6bSVictor Minden 1 0 0 53138a0b0e6bSVictor Minden 2 0 3 53148a0b0e6bSVictor Minden 4 5 6 53158a0b0e6bSVictor Minden 53168a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 53178a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 53188a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 53199e99939fSJunchao Zhang .ve 5320fe59aa6dSJacob Faibussowitsch 53212ef1f0ffSBarry Smith Note: 5322d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5323d7547e51SJunchao Zhang and are particularly useful in iterative applications. 53248a0b0e6bSVictor Minden 53251cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 53268a0b0e6bSVictor Minden @*/ 5327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5328d71ae5a4SJacob Faibussowitsch { 5329d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 53308a0b0e6bSVictor Minden 53318a0b0e6bSVictor Minden PetscFunctionBegin; 53329566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5333ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 53349566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 53359566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 53369566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 53379566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 53381230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 53391230e6d1SVictor Minden if (idx) { 53401230e6d1SVictor Minden row = i[ii] - 1; 53411230e6d1SVictor Minden col = j[ii] - 1; 53421230e6d1SVictor Minden } else { 53431230e6d1SVictor Minden row = i[ii]; 53441230e6d1SVictor Minden col = j[ii]; 53458a0b0e6bSVictor Minden } 53469566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 53478a0b0e6bSVictor Minden } 53489566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 53499566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 53509566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 53513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53528a0b0e6bSVictor Minden } 535336db0b34SBarry Smith 5354d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5355d71ae5a4SJacob Faibussowitsch { 5356acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5357acf2f550SJed Brown 5358acf2f550SJed Brown PetscFunctionBegin; 5359acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5360acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 53612205254eSKarl Rupp 53629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 53633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5364acf2f550SJed Brown } 5365acf2f550SJed Brown 5366d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5367d71ae5a4SJacob Faibussowitsch { 53689c8f2541SHong Zhang PetscFunctionBegin; 53699566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 53703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53719c8f2541SHong Zhang } 53729c8f2541SHong Zhang 537381824310SBarry Smith /* 537453dd7562SDmitry Karpeev Permute A 
into C's *local* index space using rowemb,colemb. 537553dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 537653dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 537753dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 537853dd7562SDmitry Karpeev */ 5379d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5380d71ae5a4SJacob Faibussowitsch { 538153dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 538253dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 538353dd7562SDmitry Karpeev PetscBool seqaij; 538453dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 538553dd7562SDmitry Karpeev PetscScalar v; 538653dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 538753dd7562SDmitry Karpeev 538853dd7562SDmitry Karpeev PetscFunctionBegin; 53893ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 539053dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 53919566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 539228b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 539353dd7562SDmitry Karpeev if (rowemb) { 53949566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 539508401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 539653dd7562SDmitry Karpeev } else { 539708401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 539853dd7562SDmitry Karpeev } 539953dd7562SDmitry Karpeev if (colemb) { 54009566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 540108401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 540253dd7562SDmitry Karpeev } else { 540308401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 540453dd7562SDmitry Karpeev } 540553dd7562SDmitry Karpeev 5406f4f49eeaSPierre Jolivet Baij = (Mat_SeqAIJ *)B->data; 540753dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 54089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5409ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 54109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 54119566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 541253dd7562SDmitry Karpeev } 541348a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 541453dd7562SDmitry Karpeev count = 0; 541553dd7562SDmitry Karpeev rowindices = NULL; 
541653dd7562SDmitry Karpeev colindices = NULL; 541748a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 541848a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 541953dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 542053dd7562SDmitry Karpeev PetscInt row; 542153dd7562SDmitry Karpeev row = i; 542253dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 542353dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 542453dd7562SDmitry Karpeev PetscInt col; 542553dd7562SDmitry Karpeev col = Baij->j[count]; 542653dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 542753dd7562SDmitry Karpeev v = Baij->a[count]; 54289566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 542953dd7562SDmitry Karpeev ++count; 543053dd7562SDmitry Karpeev } 543153dd7562SDmitry Karpeev } 543253dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 543353dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 543453dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 543553dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 543653dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 54373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 543853dd7562SDmitry Karpeev } 543953dd7562SDmitry Karpeev 544058c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep) 5441dec0b466SHong Zhang { 5442dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5443dec0b466SHong Zhang MatScalar *aa = a->a; 5444dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5445dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5446dec0b466SHong Zhang 5447dec0b466SHong Zhang PetscFunctionBegin; 5448dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5449dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5450dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5451dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5452dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 545358c11ad4SPierre Jolivet if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++; 5454dec0b466SHong Zhang else { 5455dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5456dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5457dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5458dec0b466SHong Zhang } 5459dec0b466SHong Zhang } 5460dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5461dec0b466SHong Zhang fshift_prev = fshift; 5462dec0b466SHong Zhang /* reset ilen and imax for each row */ 5463dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5464dec0b466SHong Zhang a->nonzerorowcnt += 
((ai[i] - fshift - ai[i - 1]) > 0); 5465dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5466dec0b466SHong Zhang } 5467312eded4SPierre Jolivet if (fshift) { 5468dec0b466SHong Zhang if (m) { 5469dec0b466SHong Zhang ai[m] -= fshift; 5470dec0b466SHong Zhang a->nz = ai[m]; 5471dec0b466SHong Zhang } 5472dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5473312eded4SPierre Jolivet A->nonzerostate++; 5474dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5475dec0b466SHong Zhang a->rmax = rmax; 5476dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5477dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5478dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5479312eded4SPierre Jolivet } 54803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5481dec0b466SHong Zhang } 5482dec0b466SHong Zhang 54834099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 54844099cc6bSBarry Smith 5485cc4c1da9SBarry Smith /*@ 548611a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 54874099cc6bSBarry Smith 5488c3339decSBarry Smith Collective 54894099cc6bSBarry Smith 54904099cc6bSBarry Smith Input Parameters: 54914099cc6bSBarry Smith + mat - the matrix object 54924099cc6bSBarry Smith - matype - matrix type 54934099cc6bSBarry Smith 54944099cc6bSBarry Smith Options Database Key: 54954e187271SRichard Tran Mills . 
-mat_seqaij_type <method> - for example seqaijcrl 54964099cc6bSBarry Smith 54974099cc6bSBarry Smith Level: intermediate 54984099cc6bSBarry Smith 5499fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType` 55004099cc6bSBarry Smith @*/ 5501d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5502d71ae5a4SJacob Faibussowitsch { 55034099cc6bSBarry Smith PetscBool sametype; 55045f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 55054099cc6bSBarry Smith 55064099cc6bSBarry Smith PetscFunctionBegin; 55074099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 55089566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 55093ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 55104099cc6bSBarry Smith 55119566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 55126adde796SStefano Zampini PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 55139566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 55143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55154099cc6bSBarry Smith } 55164099cc6bSBarry Smith 55174099cc6bSBarry Smith /*@C 551811a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 55194099cc6bSBarry Smith 5520cc4c1da9SBarry Smith Not Collective, No Fortran Support 55214099cc6bSBarry Smith 55224099cc6bSBarry Smith Input Parameters: 5523fe59aa6dSJacob Faibussowitsch + sname - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 55244099cc6bSBarry Smith - function - routine to convert to subtype 55254099cc6bSBarry Smith 55262ef1f0ffSBarry Smith Level: advanced 55272ef1f0ffSBarry Smith 55284099cc6bSBarry Smith Notes: 552911a5261eSBarry Smith 
`MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers. 55304099cc6bSBarry Smith 55314099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 55324099cc6bSBarry Smith $ -mat_seqaij_type my_mat 55334099cc6bSBarry Smith 55341cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()` 55354099cc6bSBarry Smith @*/ 5536d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5537d71ae5a4SJacob Faibussowitsch { 55384099cc6bSBarry Smith PetscFunctionBegin; 55399566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 55409566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 55413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55424099cc6bSBarry Smith } 55434099cc6bSBarry Smith 55444099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 55454099cc6bSBarry Smith 55464099cc6bSBarry Smith /*@C 554711a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 55484099cc6bSBarry Smith 55494099cc6bSBarry Smith Not Collective 55504099cc6bSBarry Smith 55514099cc6bSBarry Smith Level: advanced 55524099cc6bSBarry Smith 55532ef1f0ffSBarry Smith Note: 55542ef1f0ffSBarry Smith This registers the versions of `MATSEQAIJ` for GPUs 55552ef1f0ffSBarry Smith 55561cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()` 55574099cc6bSBarry Smith @*/ 5558d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5559d71ae5a4SJacob Faibussowitsch { 55604099cc6bSBarry Smith PetscFunctionBegin; 55613ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 55624099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 55634099cc6bSBarry Smith 55649566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 55659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 55669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 55679779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 55689566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5569485f9817SRichard Tran Mills #endif 55705063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 55719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 55725063d097SStefano Zampini #endif 5573d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5574d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5575d5e393b6SSuyash Tandon #endif 55765063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 55779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 55785063d097SStefano Zampini #endif 55794099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 55809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 55814099cc6bSBarry Smith #endif 55823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55834099cc6bSBarry Smith } 558453dd7562SDmitry Karpeev 558553dd7562SDmitry Karpeev /* 558681824310SBarry Smith Special version for direct calls from Fortran 558781824310SBarry Smith */ 558881824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 558981824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 559081824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 559181824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 559281824310SBarry Smith #endif 559381824310SBarry Smith 559481824310SBarry Smith /* Change 
these macros so can be used in void function */ 559598921bdaSJacob Faibussowitsch 559698921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 55979566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 55989566063dSJacob Faibussowitsch #undef PetscCall 55999371c9d4SSatish Balay #define PetscCall(...) \ 56009371c9d4SSatish Balay do { \ 56015f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 560298921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 560398921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 560498921bdaSJacob Faibussowitsch return; \ 560598921bdaSJacob Faibussowitsch } \ 560698921bdaSJacob Faibussowitsch } while (0) 560798921bdaSJacob Faibussowitsch 560898921bdaSJacob Faibussowitsch #undef SETERRQ 56099371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \ 56109371c9d4SSatish Balay do { \ 561198921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 561298921bdaSJacob Faibussowitsch return; \ 561398921bdaSJacob Faibussowitsch } while (0) 561481824310SBarry Smith 5615d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5616d71ae5a4SJacob Faibussowitsch { 561781824310SBarry Smith Mat A = *AA; 561881824310SBarry Smith PetscInt m = *mm, n = *nn; 561981824310SBarry Smith InsertMode is = *isis; 562081824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 562181824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 562281824310SBarry Smith PetscInt *imax, *ai, *ailen; 562381824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 562454f21887SBarry Smith MatScalar *ap, value, 
*aa; 5625ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5626ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 562781824310SBarry Smith 562881824310SBarry Smith PetscFunctionBegin; 56294994cf47SJed Brown MatCheckPreallocated(A, 1); 563081824310SBarry Smith imax = a->imax; 563181824310SBarry Smith ai = a->i; 563281824310SBarry Smith ailen = a->ilen; 563381824310SBarry Smith aj = a->j; 563481824310SBarry Smith aa = a->a; 563581824310SBarry Smith 563681824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 563781824310SBarry Smith row = im[k]; 563881824310SBarry Smith if (row < 0) continue; 56395f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 56409371c9d4SSatish Balay rp = aj + ai[row]; 56419371c9d4SSatish Balay ap = aa + ai[row]; 56429371c9d4SSatish Balay rmax = imax[row]; 56439371c9d4SSatish Balay nrow = ailen[row]; 564481824310SBarry Smith low = 0; 564581824310SBarry Smith high = nrow; 564681824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 564781824310SBarry Smith if (in[l] < 0) continue; 56485f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 564981824310SBarry Smith col = in[l]; 56502205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 56512205254eSKarl Rupp else value = v[k + l * m]; 56522205254eSKarl Rupp 565381824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 565481824310SBarry Smith 56552205254eSKarl Rupp if (col <= lastcol) low = 0; 56562205254eSKarl Rupp else high = nrow; 565781824310SBarry Smith lastcol = col; 565881824310SBarry Smith while (high - low > 5) { 565981824310SBarry Smith t = (low + high) / 2; 566081824310SBarry Smith if (rp[t] > col) high = t; 566181824310SBarry Smith else low = t; 566281824310SBarry Smith } 566381824310SBarry Smith for (i = low; i < 
high; i++) { 566481824310SBarry Smith if (rp[i] > col) break; 566581824310SBarry Smith if (rp[i] == col) { 566681824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 566781824310SBarry Smith else ap[i] = value; 566881824310SBarry Smith goto noinsert; 566981824310SBarry Smith } 567081824310SBarry Smith } 567181824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 567281824310SBarry Smith if (nonew == 1) goto noinsert; 56735f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5674fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 56759371c9d4SSatish Balay N = nrow++ - 1; 56769371c9d4SSatish Balay a->nz++; 56779371c9d4SSatish Balay high++; 567881824310SBarry Smith /* shift up all the later entries in this row */ 567981824310SBarry Smith for (ii = N; ii >= i; ii--) { 568081824310SBarry Smith rp[ii + 1] = rp[ii]; 568181824310SBarry Smith ap[ii + 1] = ap[ii]; 568281824310SBarry Smith } 568381824310SBarry Smith rp[i] = col; 568481824310SBarry Smith ap[i] = value; 568581824310SBarry Smith noinsert:; 568681824310SBarry Smith low = i + 1; 568781824310SBarry Smith } 568881824310SBarry Smith ailen[row] = nrow; 568981824310SBarry Smith } 569081824310SBarry Smith PetscFunctionReturnVoid(); 569181824310SBarry Smith } 569298921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 569398921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 569498921bdaSJacob Faibussowitsch * original definitions */ 56959566063dSJacob Faibussowitsch #undef PetscCall 569698921bdaSJacob Faibussowitsch #undef SETERRQ 5697