1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1226cec326SBarry Smith #define TYPE AIJ 1326cec326SBarry Smith #define TYPE_BS 1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 1626cec326SBarry Smith #undef TYPE 1726cec326SBarry Smith #undef TYPE_BS 1826cec326SBarry Smith 19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 20d71ae5a4SJacob Faibussowitsch { 214099cc6bSBarry Smith PetscBool flg; 224099cc6bSBarry Smith char type[256]; 234099cc6bSBarry Smith 244099cc6bSBarry Smith PetscFunctionBegin; 25d0609cedSBarry Smith PetscObjectOptionsBegin((PetscObject)A); 269566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg)); 279566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A, type)); 28d0609cedSBarry Smith PetscOptionsEnd(); 293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 304099cc6bSBarry Smith } 314099cc6bSBarry Smith 32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions) 33d71ae5a4SJacob Faibussowitsch { 340716a85fSBarry Smith PetscInt i, m, n; 350716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 360716a85fSBarry Smith 370716a85fSBarry Smith PetscFunctionBegin; 389566063dSJacob 
Faibussowitsch PetscCall(MatGetSize(A, &m, &n)); 399566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions, n)); 400716a85fSBarry Smith if (type == NORM_2) { 41ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]); 420716a85fSBarry Smith } else if (type == NORM_1) { 43ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } else if (type == NORM_INFINITY) { 45ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]); 46857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 47ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 49ad540459SPierre Jolivet for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 506adde796SStefano Zampini } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type"); 510716a85fSBarry Smith 520716a85fSBarry Smith if (type == NORM_2) { 53a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 54857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 55a873a8cdSSam Reynolds for (i = 0; i < n; i++) reductions[i] /= m; 560716a85fSBarry Smith } 573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 580716a85fSBarry Smith } 590716a85fSBarry Smith 60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is) 61d71ae5a4SJacob Faibussowitsch { 623a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 633a062f41SBarry Smith PetscInt i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs; 
643a062f41SBarry Smith const PetscInt *jj = a->j, *ii = a->i; 653a062f41SBarry Smith PetscInt *rows; 663a062f41SBarry Smith 673a062f41SBarry Smith PetscFunctionBegin; 683a062f41SBarry Smith for (i = 0; i < m; i++) { 69ad540459SPierre Jolivet if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++; 703a062f41SBarry Smith } 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i = 0; i < m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 799566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is)); 803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows) 84d71ae5a4SJacob Faibussowitsch { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 86fff043a9SJunchao Zhang const MatScalar *aa; 876ce1633cSBarry Smith PetscInt i, m = A->rmap->n, cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i, *jj = a->j, *diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith 916ce1633cSBarry Smith PetscFunctionBegin; 929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 939566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i = 0; i < m; i++) { 96ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++; 976ce1633cSBarry Smith } 989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt, &rows)); 996ce1633cSBarry Smith cnt = 0; 1006ce1633cSBarry 
Smith for (i = 0; i < m; i++) { 101ad540459SPierre Jolivet if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i; 1026ce1633cSBarry Smith } 103f1f41ecbSJed Brown *nrows = cnt; 104f1f41ecbSJed Brown *zrows = rows; 1059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107f1f41ecbSJed Brown } 108f1f41ecbSJed Brown 109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows) 110d71ae5a4SJacob Faibussowitsch { 111f1f41ecbSJed Brown PetscInt nrows, *rows; 112f1f41ecbSJed Brown 113f1f41ecbSJed Brown PetscFunctionBegin; 1140298fd71SBarry Smith *zrows = NULL; 1159566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows)); 1169566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows)); 1173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1186ce1633cSBarry Smith } 1196ce1633cSBarry Smith 120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows) 121d71ae5a4SJacob Faibussowitsch { 122b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 123b3a44c85SBarry Smith const MatScalar *aa; 124b3a44c85SBarry Smith PetscInt m = A->rmap->n, cnt = 0; 125b3a44c85SBarry Smith const PetscInt *ii; 126b3a44c85SBarry Smith PetscInt n, i, j, *rows; 127b3a44c85SBarry Smith 128b3a44c85SBarry Smith PetscFunctionBegin; 1299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 130f4259b30SLisandro Dalcin *keptrows = NULL; 131b3a44c85SBarry Smith ii = a->i; 132b3a44c85SBarry Smith for (i = 0; i < m; i++) { 133b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 134b3a44c85SBarry Smith if (!n) { 135b3a44c85SBarry Smith cnt++; 136b3a44c85SBarry Smith goto ok1; 137b3a44c85SBarry Smith } 1382e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 
139b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 140b3a44c85SBarry Smith } 141b3a44c85SBarry Smith cnt++; 142b3a44c85SBarry Smith ok1:; 143b3a44c85SBarry Smith } 1442e5835c6SStefano Zampini if (!cnt) { 1459566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1472e5835c6SStefano Zampini } 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows)); 149b3a44c85SBarry Smith cnt = 0; 150b3a44c85SBarry Smith for (i = 0; i < m; i++) { 151b3a44c85SBarry Smith n = ii[i + 1] - ii[i]; 152b3a44c85SBarry Smith if (!n) continue; 1532e5835c6SStefano Zampini for (j = ii[i]; j < ii[i + 1]; j++) { 154b3a44c85SBarry Smith if (aa[j] != 0.0) { 155b3a44c85SBarry Smith rows[cnt++] = i; 156b3a44c85SBarry Smith break; 157b3a44c85SBarry Smith } 158b3a44c85SBarry Smith } 159b3a44c85SBarry Smith } 1609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 1619566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows)); 1623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 163b3a44c85SBarry Smith } 164b3a44c85SBarry Smith 165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is) 166d71ae5a4SJacob Faibussowitsch { 16779299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)Y->data; 16899e65526SBarry Smith PetscInt i, m = Y->rmap->n; 16999e65526SBarry Smith const PetscInt *diag; 1702e5835c6SStefano Zampini MatScalar *aa; 17199e65526SBarry Smith const PetscScalar *v; 172ace3abfcSBarry Smith PetscBool missing; 17379299369SBarry Smith 17479299369SBarry Smith PetscFunctionBegin; 17509f38230SBarry Smith if (Y->assembled) { 1769566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL)); 17709f38230SBarry Smith if (!missing) { 17879299369SBarry Smith diag = aij->diag; 1799566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D, &v)); 
1809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &aa)); 18179299369SBarry Smith if (is == INSERT_VALUES) { 182ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] = v[i]; 18379299369SBarry Smith } else { 184ad540459SPierre Jolivet for (i = 0; i < m; i++) aa[diag[i]] += v[i]; 18579299369SBarry Smith } 1869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &aa)); 1879566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D, &v)); 1883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18979299369SBarry Smith } 1909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 19109f38230SBarry Smith } 1929566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y, D, is)); 1933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 19409f38230SBarry Smith } 19579299369SBarry Smith 196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 197d71ae5a4SJacob Faibussowitsch { 198416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 19997f1f81fSBarry Smith PetscInt i, ishift; 20017ab2063SBarry Smith 2013a40ed3dSBarry Smith PetscFunctionBegin; 202f1f2ae84SBarry Smith if (m) *m = A->rmap->n; 2033ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 204bfeeae90SHong Zhang ishift = 0; 205b94d7dedSBarry Smith if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) { 2069566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja)); 207bfeeae90SHong Zhang } else if (oshift == 1) { 2081a83f524SJed Brown PetscInt *tia; 209d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2103b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &tia)); 
2121a83f524SJed Brown for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1; 2131a83f524SJed Brown *ia = tia; 214ecc77c7aSBarry Smith if (ja) { 2151a83f524SJed Brown PetscInt *tja; 2169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz + 1, &tja)); 2171a83f524SJed Brown for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1; 2181a83f524SJed Brown *ja = tja; 219ecc77c7aSBarry Smith } 2206945ee14SBarry Smith } else { 221ecc77c7aSBarry Smith *ia = a->i; 222ecc77c7aSBarry Smith if (ja) *ja = a->j; 223a2ce50c7SBarry Smith } 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 225a2744918SBarry Smith } 226a2744918SBarry Smith 227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 228d71ae5a4SJacob Faibussowitsch { 2293a40ed3dSBarry Smith PetscFunctionBegin; 2303ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 231b94d7dedSBarry Smith if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) { 2329566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2339566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 234bcd2baecSBarry Smith } 2353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23617ab2063SBarry Smith } 23717ab2063SBarry Smith 238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 239d71ae5a4SJacob Faibussowitsch { 2403b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 241d0f46423SBarry Smith PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 24297f1f81fSBarry Smith PetscInt nz = a->i[m], row, *jj, mr, col; 2433b2fbd54SBarry Smith 2443a40ed3dSBarry Smith PetscFunctionBegin; 245899cda47SBarry Smith *nn = n; 2463ba16761SJacob 
Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2473b2fbd54SBarry Smith if (symmetric) { 2489566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja)); 2493b2fbd54SBarry Smith } else { 2509566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 2519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 2529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 2533b2fbd54SBarry Smith jj = a->j; 254ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 2553b2fbd54SBarry Smith cia[0] = oshift; 256ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 2579566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 2583b2fbd54SBarry Smith jj = a->j; 259a93ec695SBarry Smith for (row = 0; row < m; row++) { 260a93ec695SBarry Smith mr = a->i[row + 1] - a->i[row]; 261a93ec695SBarry Smith for (i = 0; i < mr; i++) { 262bfeeae90SHong Zhang col = *jj++; 2632205254eSKarl Rupp 2643b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2653b2fbd54SBarry Smith } 2663b2fbd54SBarry Smith } 2679566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2689371c9d4SSatish Balay *ia = cia; 2699371c9d4SSatish Balay *ja = cja; 2703b2fbd54SBarry Smith } 2713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2723b2fbd54SBarry Smith } 2733b2fbd54SBarry Smith 274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 275d71ae5a4SJacob Faibussowitsch { 2763a40ed3dSBarry Smith PetscFunctionBegin; 2773ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 2783b2fbd54SBarry Smith 2799566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2809566063dSJacob Faibussowitsch 
PetscCall(PetscFree(*ja)); 2813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith 2847cee066cSHong Zhang /* 2857cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 2867cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 287040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 2887cee066cSHong Zhang */ 289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 290d71ae5a4SJacob Faibussowitsch { 2917cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2927cee066cSHong Zhang PetscInt i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n; 293071fcb05SBarry Smith PetscInt nz = a->i[m], row, mr, col, tmp; 2947cee066cSHong Zhang PetscInt *cspidx; 295071fcb05SBarry Smith const PetscInt *jj; 2967cee066cSHong Zhang 2977cee066cSHong Zhang PetscFunctionBegin; 2987cee066cSHong Zhang *nn = n; 2993ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 300625f6d37SHong Zhang 3019566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n, &collengths)); 3029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n + 1, &cia)); 3039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cja)); 3049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &cspidx)); 3057cee066cSHong Zhang jj = a->j; 306ad540459SPierre Jolivet for (i = 0; i < nz; i++) collengths[jj[i]]++; 3077cee066cSHong Zhang cia[0] = oshift; 308ad540459SPierre Jolivet for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i]; 3099566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths, n)); 3107cee066cSHong Zhang jj = a->j; 3117cee066cSHong Zhang for (row = 0; row < m; 
row++) { 3127cee066cSHong Zhang mr = a->i[row + 1] - a->i[row]; 3137cee066cSHong Zhang for (i = 0; i < mr; i++) { 3147cee066cSHong Zhang col = *jj++; 315071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 316071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 317071fcb05SBarry Smith cja[tmp] = row + oshift; 3187cee066cSHong Zhang } 3197cee066cSHong Zhang } 3209566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 321071fcb05SBarry Smith *ia = cia; 322071fcb05SBarry Smith *ja = cja; 3237cee066cSHong Zhang *spidx = cspidx; 3243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3257cee066cSHong Zhang } 3267cee066cSHong Zhang 327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done) 328d71ae5a4SJacob Faibussowitsch { 3297cee066cSHong Zhang PetscFunctionBegin; 3309566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done)); 3319566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3337cee066cSHong Zhang } 3347cee066cSHong Zhang 335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[]) 336d71ae5a4SJacob Faibussowitsch { 33787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 33887d4246cSBarry Smith PetscInt *ai = a->i; 339fff043a9SJunchao Zhang PetscScalar *aa; 34087d4246cSBarry Smith 34187d4246cSBarry Smith PetscFunctionBegin; 3429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 3439566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row])); 3449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3453ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 34687d4246cSBarry Smith } 34787d4246cSBarry Smith 348bd04181cSBarry Smith /* 349bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 350bd04181cSBarry Smith 351bd04181cSBarry Smith - a single row of values is set with each call 352bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 353bd04181cSBarry Smith - the values are always added to the matrix, not set 354bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 355bd04181cSBarry Smith 3561f763a69SBarry Smith This does NOT assume the global column indices are sorted 357bd04181cSBarry Smith 3581f763a69SBarry Smith */ 359bd04181cSBarry Smith 360af0996ceSBarry Smith #include <petsc/private/isimpl.h> 361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 362d71ae5a4SJacob Faibussowitsch { 363189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3641f763a69SBarry Smith PetscInt low, high, t, row, nrow, i, col, l; 3651f763a69SBarry Smith const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j; 3661f763a69SBarry Smith PetscInt lastcol = -1; 367fff043a9SJunchao Zhang MatScalar *ap, value, *aa; 368189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices; 369189e4007SBarry Smith 370fff043a9SJunchao Zhang PetscFunctionBegin; 3719566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 372f38dd0b8SBarry Smith row = ridx[im[0]]; 3731f763a69SBarry Smith rp = aj + ai[row]; 3741f763a69SBarry Smith ap = aa + ai[row]; 3751f763a69SBarry Smith nrow = ailen[row]; 376189e4007SBarry Smith low = 0; 377189e4007SBarry Smith high = nrow; 378189e4007SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 
379189e4007SBarry Smith col = cidx[in[l]]; 380f38dd0b8SBarry Smith value = v[l]; 381189e4007SBarry Smith 382189e4007SBarry Smith if (col <= lastcol) low = 0; 383189e4007SBarry Smith else high = nrow; 384189e4007SBarry Smith lastcol = col; 385189e4007SBarry Smith while (high - low > 5) { 386189e4007SBarry Smith t = (low + high) / 2; 387189e4007SBarry Smith if (rp[t] > col) high = t; 388189e4007SBarry Smith else low = t; 389189e4007SBarry Smith } 390189e4007SBarry Smith for (i = low; i < high; i++) { 391189e4007SBarry Smith if (rp[i] == col) { 3921f763a69SBarry Smith ap[i] += value; 393189e4007SBarry Smith low = i + 1; 3941f763a69SBarry Smith break; 395189e4007SBarry Smith } 396189e4007SBarry Smith } 397189e4007SBarry Smith } 3989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 3993ba16761SJacob Faibussowitsch return PETSC_SUCCESS; 400189e4007SBarry Smith } 401189e4007SBarry Smith 402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 403d71ae5a4SJacob Faibussowitsch { 404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 405e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 40697f1f81fSBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 407e2ee6c50SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, lastcol = -1; 408ce496241SStefano Zampini MatScalar *ap = NULL, value = 0.0, *aa; 409ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 410ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 41117ab2063SBarry Smith 4123a40ed3dSBarry Smith PetscFunctionBegin; 4139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 41417ab2063SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 415416022c9SBarry Smith row = im[k]; 4165ef9f2a5SBarry Smith if (row < 0) continue; 4176bdcaf15SBarry Smith PetscCheck(row < A->rmap->n, 
PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 418*8e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 419*8e3a54c0SPierre Jolivet if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]); 4209371c9d4SSatish Balay rmax = imax[row]; 4219371c9d4SSatish Balay nrow = ailen[row]; 422416022c9SBarry Smith low = 0; 423c71e6ed7SBarry Smith high = nrow; 42417ab2063SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 4255ef9f2a5SBarry Smith if (in[l] < 0) continue; 4266bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 427bfeeae90SHong Zhang col = in[l]; 428071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m]; 429071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 43036db0b34SBarry Smith 4312205254eSKarl Rupp if (col <= lastcol) low = 0; 4322205254eSKarl Rupp else high = nrow; 433e2ee6c50SBarry Smith lastcol = col; 434416022c9SBarry Smith while (high - low > 5) { 435416022c9SBarry Smith t = (low + high) / 2; 436416022c9SBarry Smith if (rp[t] > col) high = t; 437416022c9SBarry Smith else low = t; 43817ab2063SBarry Smith } 439416022c9SBarry Smith for (i = low; i < high; i++) { 44017ab2063SBarry Smith if (rp[i] > col) break; 44117ab2063SBarry Smith if (rp[i] == col) { 442876c6284SHong Zhang if (!A->structure_only) { 4430c0d7e18SFande Kong if (is == ADD_VALUES) { 4440c0d7e18SFande Kong ap[i] += value; 4450c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4469371c9d4SSatish Balay } else ap[i] = value; 447720833daSHong Zhang } 448e44c0bd4SBarry Smith low = i + 1; 44917ab2063SBarry Smith goto noinsert; 45017ab2063SBarry Smith } 45117ab2063SBarry Smith } 452dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row 
!= col) goto noinsert; 453c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 45408401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col); 455720833daSHong Zhang if (A->structure_only) { 456876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar); 457720833daSHong Zhang } else { 458fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 459720833daSHong Zhang } 4609371c9d4SSatish Balay N = nrow++ - 1; 4619371c9d4SSatish Balay a->nz++; 4629371c9d4SSatish Balay high++; 463416022c9SBarry Smith /* shift up all the later entries in this row */ 4649566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 46517ab2063SBarry Smith rp[i] = col; 466580bdb30SBarry Smith if (!A->structure_only) { 4679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1)); 468580bdb30SBarry Smith ap[i] = value; 469580bdb30SBarry Smith } 470416022c9SBarry Smith low = i + 1; 471e56f5c9eSBarry Smith A->nonzerostate++; 472e44c0bd4SBarry Smith noinsert:; 47317ab2063SBarry Smith } 47417ab2063SBarry Smith ailen[row] = nrow; 47517ab2063SBarry Smith } 4769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 4773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 47817ab2063SBarry Smith } 47917ab2063SBarry Smith 480ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 481d71ae5a4SJacob Faibussowitsch { 48219b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 48319b08ed1SBarry Smith PetscInt *rp, k, row; 48419b08ed1SBarry Smith PetscInt *ai = a->i; 48519b08ed1SBarry Smith 
PetscInt *aj = a->j; 486fff043a9SJunchao Zhang MatScalar *aa, *ap; 48719b08ed1SBarry Smith 48819b08ed1SBarry Smith PetscFunctionBegin; 48928b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix."); 49008401ef6SPierre Jolivet PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz); 491fff043a9SJunchao Zhang 4929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 49319b08ed1SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 49419b08ed1SBarry Smith row = im[k]; 49519b08ed1SBarry Smith rp = aj + ai[row]; 496*8e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 49719b08ed1SBarry Smith 4989566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 49919b08ed1SBarry Smith if (!A->structure_only) { 50019b08ed1SBarry Smith if (v) { 5019566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 50219b08ed1SBarry Smith v += n; 50319b08ed1SBarry Smith } else { 5049566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 50519b08ed1SBarry Smith } 50619b08ed1SBarry Smith } 50719b08ed1SBarry Smith a->ilen[row] = n; 50819b08ed1SBarry Smith a->imax[row] = n; 50919b08ed1SBarry Smith a->i[row + 1] = a->i[row] + n; 51019b08ed1SBarry Smith a->nz += n; 51119b08ed1SBarry Smith } 5129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51419b08ed1SBarry Smith } 51519b08ed1SBarry Smith 51619b08ed1SBarry Smith /*@ 51719b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 
51819b08ed1SBarry Smith 51919b08ed1SBarry Smith Input Parameters: 52011a5261eSBarry Smith + A - the `MATSEQAIJ` matrix 52119b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 52219b08ed1SBarry Smith 52319b08ed1SBarry Smith Level: advanced 52419b08ed1SBarry Smith 52519b08ed1SBarry Smith Notes: 52619b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 52711a5261eSBarry Smith Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used 52819b08ed1SBarry Smith as always with multiple matrix assemblies. 52919b08ed1SBarry Smith 5301cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()` 53119b08ed1SBarry Smith @*/ 532d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal) 533d71ae5a4SJacob Faibussowitsch { 53419b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 53519b08ed1SBarry Smith 53619b08ed1SBarry Smith PetscFunctionBegin; 5379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5389566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 53919b08ed1SBarry Smith a->maxnz = nztotal; 5404dfa11a4SJacob Faibussowitsch if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); } 54119b08ed1SBarry Smith if (!a->ilen) { 5429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n, &a->ilen)); 54319b08ed1SBarry Smith } else { 5449566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt))); 54519b08ed1SBarry Smith } 54619b08ed1SBarry Smith 54719b08ed1SBarry Smith /* allocate the matrix space */ 54819b08ed1SBarry Smith if (A->structure_only) { 5499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal, &a->j)); 5509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i)); 55119b08ed1SBarry Smith } 
else { 5529566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i)); 55319b08ed1SBarry Smith } 55419b08ed1SBarry Smith a->i[0] = 0; 55519b08ed1SBarry Smith if (A->structure_only) { 55619b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 55719b08ed1SBarry Smith a->free_a = PETSC_FALSE; 55819b08ed1SBarry Smith } else { 55919b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 56019b08ed1SBarry Smith a->free_a = PETSC_TRUE; 56119b08ed1SBarry Smith } 56219b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 56319b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 56419b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 5653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56619b08ed1SBarry Smith } 56719b08ed1SBarry Smith 568ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 569d71ae5a4SJacob Faibussowitsch { 570071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 571071fcb05SBarry Smith PetscInt *rp, k, row; 572071fcb05SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 573071fcb05SBarry Smith PetscInt *aj = a->j; 574fff043a9SJunchao Zhang MatScalar *aa, *ap; 575071fcb05SBarry Smith 576071fcb05SBarry Smith PetscFunctionBegin; 5779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 578071fcb05SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 579071fcb05SBarry Smith row = im[k]; 5806bdcaf15SBarry Smith PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n); 581071fcb05SBarry Smith rp = aj + ai[row]; 582071fcb05SBarry Smith ap = aa + ai[row]; 58348a46eb9SPierre Jolivet if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt))); 584071fcb05SBarry Smith if (!A->structure_only) { 585071fcb05SBarry 
Smith if (v) { 5869566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar))); 587071fcb05SBarry Smith v += n; 588071fcb05SBarry Smith } else { 5899566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar))); 590071fcb05SBarry Smith } 591071fcb05SBarry Smith } 592071fcb05SBarry Smith ailen[row] = n; 593071fcb05SBarry Smith a->nz += n; 594071fcb05SBarry Smith } 5959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 5963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 597071fcb05SBarry Smith } 598071fcb05SBarry Smith 599ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 600d71ae5a4SJacob Faibussowitsch { 6017eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 60297f1f81fSBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 60397f1f81fSBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 6044e208921SJed Brown const MatScalar *ap, *aa; 6057eb43aa7SLois Curfman McInnes 6063a40ed3dSBarry Smith PetscFunctionBegin; 6074e208921SJed Brown PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 6087eb43aa7SLois Curfman McInnes for (k = 0; k < m; k++) { /* loop over rows */ 6097eb43aa7SLois Curfman McInnes row = im[k]; 6109371c9d4SSatish Balay if (row < 0) { 6119371c9d4SSatish Balay v += n; 6129371c9d4SSatish Balay continue; 6139371c9d4SSatish Balay } /* negative row */ 61454c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1); 615*8e3a54c0SPierre Jolivet rp = PetscSafePointerPlusOffset(aj, ai[row]); 616*8e3a54c0SPierre Jolivet ap = PetscSafePointerPlusOffset(aa, ai[row]); 6177eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6187eb43aa7SLois Curfman McInnes for (l = 0; l < n; l++) { /* loop over columns */ 6199371c9d4SSatish Balay if 
(in[l] < 0) { 6209371c9d4SSatish Balay v++; 6219371c9d4SSatish Balay continue; 6229371c9d4SSatish Balay } /* negative column */ 62354c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 624bfeeae90SHong Zhang col = in[l]; 6259371c9d4SSatish Balay high = nrow; 6269371c9d4SSatish Balay low = 0; /* assume unsorted */ 6277eb43aa7SLois Curfman McInnes while (high - low > 5) { 6287eb43aa7SLois Curfman McInnes t = (low + high) / 2; 6297eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6307eb43aa7SLois Curfman McInnes else low = t; 6317eb43aa7SLois Curfman McInnes } 6327eb43aa7SLois Curfman McInnes for (i = low; i < high; i++) { 6337eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6347eb43aa7SLois Curfman McInnes if (rp[i] == col) { 635b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6367eb43aa7SLois Curfman McInnes goto finished; 6377eb43aa7SLois Curfman McInnes } 6387eb43aa7SLois Curfman McInnes } 63997e567efSBarry Smith *v++ = 0.0; 6407eb43aa7SLois Curfman McInnes finished:; 6417eb43aa7SLois Curfman McInnes } 6427eb43aa7SLois Curfman McInnes } 6434e208921SJed Brown PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 6443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6457eb43aa7SLois Curfman McInnes } 6467eb43aa7SLois Curfman McInnes 647ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 648d71ae5a4SJacob Faibussowitsch { 6493ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ *)mat->data; 650c898d852SStefano Zampini const PetscScalar *av; 6513ea6fe3dSLisandro Dalcin PetscInt header[4], M, N, m, nz, i; 6523ea6fe3dSLisandro Dalcin PetscInt *rowlens; 65317ab2063SBarry Smith 6543a40ed3dSBarry Smith PetscFunctionBegin; 6559566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6562205254eSKarl Rupp 6573ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6583ea6fe3dSLisandro 
Dalcin N = mat->cmap->N; 6593ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6603ea6fe3dSLisandro Dalcin nz = A->nz; 661416022c9SBarry Smith 6623ea6fe3dSLisandro Dalcin /* write matrix header */ 6633ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6649371c9d4SSatish Balay header[1] = M; 6659371c9d4SSatish Balay header[2] = N; 6669371c9d4SSatish Balay header[3] = nz; 6679566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT)); 668416022c9SBarry Smith 6693ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6709566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &rowlens)); 6713ea6fe3dSLisandro Dalcin for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i]; 6729566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT)); 6739566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6743ea6fe3dSLisandro Dalcin /* store column indices */ 6759566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT)); 676416022c9SBarry Smith /* store nonzero values */ 6779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat, &av)); 6789566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR)); 6799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat, &av)); 680b37d52dbSMark F. 
Adams 6813ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6829566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat, viewer)); 6833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 68417ab2063SBarry Smith } 685416022c9SBarry Smith 686d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer) 687d71ae5a4SJacob Faibussowitsch { 6887dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 6897dc0baabSHong Zhang PetscInt i, k, m = A->rmap->N; 6907dc0baabSHong Zhang 6917dc0baabSHong Zhang PetscFunctionBegin; 6929566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 6937dc0baabSHong Zhang for (i = 0; i < m; i++) { 6949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 69548a46eb9SPierre Jolivet for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k])); 6969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 6977dc0baabSHong Zhang } 6989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 6993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7007dc0baabSHong Zhang } 7017dc0baabSHong Zhang 70209573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer); 703cd155464SBarry Smith 704ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer) 705d71ae5a4SJacob Faibussowitsch { 706416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 707c898d852SStefano Zampini const PetscScalar *av; 70860e0710aSBarry Smith PetscInt i, j, m = A->rmap->n; 709e060cb09SBarry Smith const char *name; 710f3ef73ceSBarry Smith PetscViewerFormat format; 71117ab2063SBarry Smith 7123a40ed3dSBarry Smith PetscFunctionBegin; 7137dc0baabSHong Zhang if (A->structure_only) { 7149566063dSJacob Faibussowitsch 
PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer)); 7153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7167dc0baabSHong Zhang } 71743e49210SHong Zhang 7189566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 7193ba16761SJacob Faibussowitsch if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS); 7202e5835c6SStefano Zampini 721c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 7239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 72471c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 72597f1f81fSBarry Smith PetscInt nofinalvalue = 0; 72660e0710aSBarry Smith if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) { 727c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 728d00d2cf4SBarry Smith nofinalvalue = 1; 729d00d2cf4SBarry Smith } 7309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n)); 7329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz)); 733fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue)); 735fbfe6fa7SJed Brown #else 7369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue)); 737fbfe6fa7SJed Brown #endif 7389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n")); 73917ab2063SBarry Smith 74017ab2063SBarry Smith for (i = 0; i < m; i++) { 74160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 742aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7439566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 74417ab2063SBarry Smith #else 7459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j])); 74617ab2063SBarry Smith #endif 74717ab2063SBarry Smith } 74817ab2063SBarry Smith } 749d00d2cf4SBarry Smith if (nofinalvalue) { 750c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n", m, A->cmap->n, 0., 0.)); 752c337ccceSJed Brown #else 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n", m, 
A->cmap->n, 0.0)); 754c337ccceSJed Brown #endif 755d00d2cf4SBarry Smith } 7569566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A, &name)); 7579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name)); 7589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 759fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7609566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 76144cd7ae7SLois Curfman McInnes for (i = 0; i < m; i++) { 7629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 76360e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 764aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 76536db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 76736db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 76936db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 7716831982aSBarry Smith } 77244cd7ae7SLois Curfman McInnes #else 7739566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 77444cd7ae7SLois Curfman McInnes #endif 77544cd7ae7SLois Curfman McInnes } 7769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 77744cd7ae7SLois 
Curfman McInnes } 7789566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 779fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 78097f1f81fSBarry Smith PetscInt nzd = 0, fshift = 1, *sptr; 7819566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 7829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &sptr)); 783496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 784496be53dSLois Curfman McInnes sptr[i] = nzd + 1; 78560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 786496be53dSLois Curfman McInnes if (a->j[j] >= i) { 787aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78836db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 789496be53dSLois Curfman McInnes #else 790496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 791496be53dSLois Curfman McInnes #endif 792496be53dSLois Curfman McInnes } 793496be53dSLois Curfman McInnes } 794496be53dSLois Curfman McInnes } 7952e44a96cSLois Curfman McInnes sptr[m] = nzd + 1; 7969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd)); 7972e44a96cSLois Curfman McInnes for (i = 0; i < m + 1; i += 6) { 7982205254eSKarl Rupp if (i + 4 < m) { 7999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5])); 8002205254eSKarl Rupp } else if (i + 3 < m) { 8019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4])); 8022205254eSKarl Rupp } else if (i + 2 < m) { 8039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" 
PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3])); 8042205254eSKarl Rupp } else if (i + 1 < m) { 8059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2])); 8062205254eSKarl Rupp } else if (i < m) { 8079566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1])); 8082205254eSKarl Rupp } else { 8099566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i])); 8102205254eSKarl Rupp } 811496be53dSLois Curfman McInnes } 8129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 8139566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 814496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 81560e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8169566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift)); 817496be53dSLois Curfman McInnes } 8189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 819496be53dSLois Curfman McInnes } 8209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 821496be53dSLois Curfman McInnes for (i = 0; i < m; i++) { 82260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 823496be53dSLois Curfman McInnes if (a->j[j] >= i) { 824aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 82548a46eb9SPierre Jolivet if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 826496be53dSLois Curfman McInnes #else 8279566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j])); 
828496be53dSLois Curfman McInnes #endif 829496be53dSLois Curfman McInnes } 830496be53dSLois Curfman McInnes } 8319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 832496be53dSLois Curfman McInnes } 8339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 834fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 83597f1f81fSBarry Smith PetscInt cnt = 0, jcnt; 83687828ca2SBarry Smith PetscScalar value; 83768f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 83868f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 83968f1ed48SBarry Smith 84068f1ed48SBarry Smith for (i = 0; i < a->i[m]; i++) { 84168f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 84268f1ed48SBarry Smith realonly = PETSC_FALSE; 84368f1ed48SBarry Smith break; 84468f1ed48SBarry Smith } 84568f1ed48SBarry Smith } 84668f1ed48SBarry Smith #endif 84702594712SBarry Smith 8489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 84902594712SBarry Smith for (i = 0; i < m; i++) { 85002594712SBarry Smith jcnt = 0; 851d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 852e24b481bSBarry Smith if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) { 85302594712SBarry Smith value = a->a[cnt++]; 854e24b481bSBarry Smith jcnt++; 85502594712SBarry Smith } else { 85602594712SBarry Smith value = 0.0; 85702594712SBarry Smith } 858aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 85968f1ed48SBarry Smith if (realonly) { 8609566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value))); 86168f1ed48SBarry Smith } else { 8629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value))); 86368f1ed48SBarry Smith } 86402594712SBarry Smith #else 8659566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value)); 86602594712SBarry Smith 
#endif 86702594712SBarry Smith } 8689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 86902594712SBarry Smith } 8709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8713c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 872150b93efSMatthew G. Knepley PetscInt fshift = 1; 8739566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 8743c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8759566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n")); 8763c215bfdSMatthew Knepley #else 8779566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n")); 8783c215bfdSMatthew Knepley #endif 8799566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 8803c215bfdSMatthew Knepley for (i = 0; i < m; i++) { 88160e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 8823c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8839566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 8843c215bfdSMatthew Knepley #else 8859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j])); 8863c215bfdSMatthew Knepley #endif 8873c215bfdSMatthew Knepley } 8883c215bfdSMatthew Knepley } 8899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 8903a40ed3dSBarry Smith } else { 8919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 892d5f3da31SBarry Smith if (A->factortype) { 89316cd7e1dSShri Abhyankar for (i = 0; i < 
m; i++) { 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 89516cd7e1dSShri Abhyankar /* L part */ 89660e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 89716cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89816cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 8999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 90016cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 90216cd7e1dSShri Abhyankar } else { 9039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 90416cd7e1dSShri Abhyankar } 90516cd7e1dSShri Abhyankar #else 9069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 90716cd7e1dSShri Abhyankar #endif 90816cd7e1dSShri Abhyankar } 90916cd7e1dSShri Abhyankar /* diagonal */ 91016cd7e1dSShri Abhyankar j = a->diag[i]; 91116cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91216cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j]))); 91416cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j])))); 91616cd7e1dSShri Abhyankar } else { 9179566063dSJacob 
Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j]))); 91816cd7e1dSShri Abhyankar } 91916cd7e1dSShri Abhyankar #else 9209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j]))); 92116cd7e1dSShri Abhyankar #endif 92216cd7e1dSShri Abhyankar 92316cd7e1dSShri Abhyankar /* U part */ 92460e0710aSBarry Smith for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) { 92516cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 92616cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 92816cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j])))); 93016cd7e1dSShri Abhyankar } else { 9319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 93216cd7e1dSShri Abhyankar } 93316cd7e1dSShri Abhyankar #else 9349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 93516cd7e1dSShri Abhyankar #endif 93616cd7e1dSShri Abhyankar } 9379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 93816cd7e1dSShri Abhyankar } 93916cd7e1dSShri Abhyankar } else { 94017ab2063SBarry Smith for (i = 0; i < m; i++) { 9419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 94260e0710aSBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 943aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 94436db0b34SBarry Smith if 
(PetscImaginaryPart(a->a[j]) > 0.0) { 9459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j]))); 94636db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9479566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j]))); 9483a40ed3dSBarry Smith } else { 9499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j]))); 95017ab2063SBarry Smith } 95117ab2063SBarry Smith #else 9529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j])); 95317ab2063SBarry Smith #endif 95417ab2063SBarry Smith } 9559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 95617ab2063SBarry Smith } 95716cd7e1dSShri Abhyankar } 9589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 95917ab2063SBarry Smith } 9609566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 962416022c9SBarry Smith } 963416022c9SBarry Smith 9649804daf3SBarry Smith #include <petscdraw.h> 965ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 966d71ae5a4SJacob Faibussowitsch { 967480ef9eaSBarry Smith Mat A = (Mat)Aa; 968416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 969383922c3SLisandro Dalcin PetscInt i, j, m = A->rmap->n; 970383922c3SLisandro Dalcin int color; 971b05fc000SLisandro Dalcin PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 972b0a32e0cSBarry Smith PetscViewer viewer; 973f3ef73ceSBarry Smith PetscViewerFormat format; 974fff043a9SJunchao Zhang const PetscScalar *aa; 975cddf8d76SBarry Smith 
9763a40ed3dSBarry Smith PetscFunctionBegin; 9779566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 9789566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 9799566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 980383922c3SLisandro Dalcin 981416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 983fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 984d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 9850513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 986b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 987416022c9SBarry Smith for (i = 0; i < m; i++) { 9889371c9d4SSatish Balay y_l = m - i - 1.0; 9899371c9d4SSatish Balay y_r = y_l + 1.0; 990bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 9919371c9d4SSatish Balay x_l = a->j[j]; 9929371c9d4SSatish Balay x_r = x_l + 1.0; 993fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 9949566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 995cddf8d76SBarry Smith } 996cddf8d76SBarry Smith } 997b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 998cddf8d76SBarry Smith for (i = 0; i < m; i++) { 9999371c9d4SSatish Balay y_l = m - i - 1.0; 10009371c9d4SSatish Balay y_r = y_l + 1.0; 1001bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10029371c9d4SSatish Balay x_l = a->j[j]; 10039371c9d4SSatish Balay x_r = x_l + 1.0; 1004fff043a9SJunchao Zhang if (aa[j] != 0.) 
continue; 10059566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1006cddf8d76SBarry Smith } 1007cddf8d76SBarry Smith } 1008b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1009cddf8d76SBarry Smith for (i = 0; i < m; i++) { 10109371c9d4SSatish Balay y_l = m - i - 1.0; 10119371c9d4SSatish Balay y_r = y_l + 1.0; 1012bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 10139371c9d4SSatish Balay x_l = a->j[j]; 10149371c9d4SSatish Balay x_r = x_l + 1.0; 1015fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) continue; 10169566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 1017416022c9SBarry Smith } 1018416022c9SBarry Smith } 1019d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10200513a670SBarry Smith } else { 10210513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10220513a670SBarry Smith /* first determine max of all nonzero values */ 1023b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1024383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1025b0a32e0cSBarry Smith PetscDraw popup; 10260513a670SBarry Smith 10270513a670SBarry Smith for (i = 0; i < nz; i++) { 1028fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10290513a670SBarry Smith } 1030383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10319566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw, &popup)); 10329566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup, minv, maxv)); 1033383922c3SLisandro Dalcin 1034d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 10350513a670SBarry Smith for (i = 0; i < m; i++) { 1036383922c3SLisandro Dalcin y_l = m - i - 1.0; 1037383922c3SLisandro Dalcin y_r = y_l + 1.0; 1038bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1039383922c3SLisandro Dalcin x_l = a->j[j]; 1040383922c3SLisandro Dalcin x_r = x_l + 1.0; 
1041fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv); 10429566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color)); 10430513a670SBarry Smith count++; 10440513a670SBarry Smith } 10450513a670SBarry Smith } 1046d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 10470513a670SBarry Smith } 10489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 10493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1050480ef9eaSBarry Smith } 1051cddf8d76SBarry Smith 10529804daf3SBarry Smith #include <petscdraw.h> 1053ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer) 1054d71ae5a4SJacob Faibussowitsch { 1055b0a32e0cSBarry Smith PetscDraw draw; 105636db0b34SBarry Smith PetscReal xr, yr, xl, yl, h, w; 1057ace3abfcSBarry Smith PetscBool isnull; 1058480ef9eaSBarry Smith 1059480ef9eaSBarry Smith PetscFunctionBegin; 10609566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 10619566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 10623ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 1063480ef9eaSBarry Smith 10649371c9d4SSatish Balay xr = A->cmap->n; 10659371c9d4SSatish Balay yr = A->rmap->n; 10669371c9d4SSatish Balay h = yr / 10.0; 10679371c9d4SSatish Balay w = xr / 10.0; 10689371c9d4SSatish Balay xr += w; 10699371c9d4SSatish Balay yr += h; 10709371c9d4SSatish Balay xl = -w; 10719371c9d4SSatish Balay yl = -h; 10729566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 10739566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 10749566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A)); 10759566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 10769566063dSJacob 
Faibussowitsch PetscCall(PetscDrawSave(draw)); 10773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1078416022c9SBarry Smith } 1079416022c9SBarry Smith 1080d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer) 1081d71ae5a4SJacob Faibussowitsch { 1082ace3abfcSBarry Smith PetscBool iascii, isbinary, isdraw; 1083416022c9SBarry Smith 10843a40ed3dSBarry Smith PetscFunctionBegin; 10859566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 10869566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 10879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 10881baa6e33SBarry Smith if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer)); 10891baa6e33SBarry Smith else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer)); 10901baa6e33SBarry Smith else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer)); 10919566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A, viewer)); 10923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109317ab2063SBarry Smith } 109419bcc07fSBarry Smith 1095d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode) 1096d71ae5a4SJacob Faibussowitsch { 1097416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1098580bdb30SBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 1099bc43efbbSJunchao Zhang PetscInt m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n; 110054f21887SBarry Smith MatScalar *aa = a->a, *ap; 11013447b6efSHong Zhang PetscReal ratio = 0.6; 110217ab2063SBarry Smith 11033a40ed3dSBarry Smith PetscFunctionBegin; 11043ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 11059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1106b215bc84SStefano Zampini if 
(A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1107b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11089566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1110b215bc84SStefano Zampini } 111117ab2063SBarry Smith 111243ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 111317ab2063SBarry Smith for (i = 1; i < m; i++) { 1114416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 111517ab2063SBarry Smith fshift += imax[i - 1] - ailen[i - 1]; 111694a9d846SBarry Smith rmax = PetscMax(rmax, ailen[i]); 111717ab2063SBarry Smith if (fshift) { 1118bfeeae90SHong Zhang ip = aj + ai[i]; 1119bfeeae90SHong Zhang ap = aa + ai[i]; 112017ab2063SBarry Smith N = ailen[i]; 11219566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 112248a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N)); 112317ab2063SBarry Smith } 112417ab2063SBarry Smith ai[i] = ai[i - 1] + ailen[i - 1]; 112517ab2063SBarry Smith } 112617ab2063SBarry Smith if (m) { 112717ab2063SBarry Smith fshift += imax[m - 1] - ailen[m - 1]; 112817ab2063SBarry Smith ai[m] = ai[m - 1] + ailen[m - 1]; 112917ab2063SBarry Smith } 113017ab2063SBarry Smith /* reset ilen and imax for each row */ 11317b083b7cSBarry Smith a->nonzerorowcnt = 0; 1132396832f4SHong Zhang if (A->structure_only) { 11339566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11349566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1135396832f4SHong Zhang } else { /* !A->structure_only */ 113617ab2063SBarry Smith for (i = 0; i < m; i++) { 113717ab2063SBarry Smith ailen[i] = imax[i] = ai[i + 1] - ai[i]; 11387b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0); 113917ab2063SBarry Smith } 1140396832f4SHong Zhang } 
1141bfeeae90SHong Zhang a->nz = ai[m]; 1142aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 1143bc43efbbSJunchao Zhang PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly 1144bc43efbbSJunchao Zhang a->diagonaldense = PETSC_TRUE; 1145bc43efbbSJunchao Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1146bc43efbbSJunchao Zhang for (i = 0; i < n; i++) { 1147bc43efbbSJunchao Zhang if (a->diag[i] >= ai[i + 1]) { 1148bc43efbbSJunchao Zhang a->diagonaldense = PETSC_FALSE; 1149bc43efbbSJunchao Zhang break; 1150bc43efbbSJunchao Zhang } 1151bc43efbbSJunchao Zhang } 11529566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz)); 11539566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs)); 11549566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax)); 11552205254eSKarl Rupp 11568e58a170SBarry Smith A->info.mallocs += a->reallocs; 1157dd5f02e7SSatish Balay a->reallocs = 0; 11586712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 115936db0b34SBarry Smith a->rmax = rmax; 11604e220ebcSLois Curfman McInnes 116148a46eb9SPierre Jolivet if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio)); 11629566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); 11633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 116417ab2063SBarry Smith } 116517ab2063SBarry Smith 1166ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A) 1167d71ae5a4SJacob Faibussowitsch 
{ 116899cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 116999cafbc1SBarry Smith PetscInt i, nz = a->nz; 11702e5835c6SStefano Zampini MatScalar *aa; 117199cafbc1SBarry Smith 117299cafbc1SBarry Smith PetscFunctionBegin; 11739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 117499cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 117899cafbc1SBarry Smith } 117999cafbc1SBarry Smith 1180ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 1181d71ae5a4SJacob Faibussowitsch { 118299cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 118399cafbc1SBarry Smith PetscInt i, nz = a->nz; 11842e5835c6SStefano Zampini MatScalar *aa; 118599cafbc1SBarry Smith 118699cafbc1SBarry Smith PetscFunctionBegin; 11879566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 118899cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 11909566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 11913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119299cafbc1SBarry Smith } 119399cafbc1SBarry Smith 1194d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 1195d71ae5a4SJacob Faibussowitsch { 1196fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1197fff043a9SJunchao Zhang MatScalar *aa; 11983a40ed3dSBarry Smith 11993a40ed3dSBarry Smith PetscFunctionBegin; 12009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A, &aa)); 12019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa, a->i[A->rmap->n])); 12029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa)); 12039566063dSJacob 
Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 12043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120517ab2063SBarry Smith } 1206416022c9SBarry Smith 1207d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A) 1208d71ae5a4SJacob Faibussowitsch { 1209416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1210d5d45c9bSBarry Smith 12113a40ed3dSBarry Smith PetscFunctionBegin; 1212b4e2f619SBarry Smith if (A->hash_active) { 1213e3c72094SPierre Jolivet A->ops[0] = a->cops; 1214b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 1215b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 1216b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 1217b4e2f619SBarry Smith } 1218b4e2f619SBarry Smith 12193ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz)); 12209566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 12219566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12229566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12239566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12249566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12259566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12279566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12289566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work)); 12299566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12309566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12319566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12329566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex)); 12339566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12349566063dSJacob Faibussowitsch 
PetscCall(PetscFree(A->data)); 1235901853e0SKris Buschelman 12366718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12376718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12386718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. We free it here to avoid 12396718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12406718818eSStefano Zampini due to different matrix sizes */ 12419566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL)); 12426718818eSStefano Zampini 12439566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 12442e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL)); 12452e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL)); 12469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL)); 12479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 12489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 12499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL)); 12509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL)); 12519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL)); 12522e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL)); 12532e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE) 12542e956fe4SStefano Zampini 
PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL)); 12552e956fe4SStefano Zampini #endif 12564222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL)); 12589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL)); 12599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL)); 12604222ddf1SHong Zhang #endif 1261d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 1262d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL)); 1263d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL)); 1264d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL)); 1265d5e393b6SSuyash Tandon #endif 12663d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL)); 12683d0639e7SStefano Zampini #endif 12699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL)); 1270af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL)); 1272af8000cdSHong Zhang #endif 1273d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL)); 1275d24d4204SJose E. 
Roman #endif 127663c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL)); 12789566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL)); 127963c07aadSStefano Zampini #endif 12809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL)); 12819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL)); 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL)); 12839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL)); 12842e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL)); 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL)); 12869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL)); 12879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL)); 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL)); 12909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL)); 12919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL)); 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, 
"MatSeqAIJKron_C", NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL)); 12949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL)); 12952e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 12962e956fe4SStefano Zampini /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */ 12972e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL)); 12982e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL)); 12992e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL)); 13002e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL)); 13012e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL)); 13023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 130317ab2063SBarry Smith } 130417ab2063SBarry Smith 1305d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg) 1306d71ae5a4SJacob Faibussowitsch { 1307416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 13083a40ed3dSBarry Smith 13093a40ed3dSBarry Smith PetscFunctionBegin; 1310a65d3064SKris Buschelman switch (op) { 1311d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 1312d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 1313d71ae5a4SJacob Faibussowitsch break; 1314d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 1315d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 1316d71ae5a4SJacob Faibussowitsch break; 1317d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 
1318d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 1319d71ae5a4SJacob Faibussowitsch break; 1320d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 1321d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 1322d71ae5a4SJacob Faibussowitsch break; 1323d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 1324d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 1325d71ae5a4SJacob Faibussowitsch break; 1326d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 1327d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 1328d71ae5a4SJacob Faibussowitsch break; 1329d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_ZERO_ENTRIES: 1330d71ae5a4SJacob Faibussowitsch a->ignorezeroentries = flg; 1331d71ae5a4SJacob Faibussowitsch break; 13323d472b54SHong Zhang case MAT_SPD: 1333b1646e73SJed Brown case MAT_SYMMETRIC: 1334b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1335b1646e73SJed Brown case MAT_HERMITIAN: 1336b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1337957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 1338b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 1339b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 1340b94d7dedSBarry Smith /* if the diagonal matrix is square it inherits some of the properties above */ 13415021d80fSJed Brown break; 13428c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1343a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1344d71ae5a4SJacob Faibussowitsch case MAT_USE_HASH_TABLE: 1345d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 1346d71ae5a4SJacob Faibussowitsch break; 1347d71ae5a4SJacob Faibussowitsch case MAT_USE_INODES: 1348d71ae5a4SJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg)); 1349d71ae5a4SJacob Faibussowitsch break; 1350d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 1351d71ae5a4SJacob Faibussowitsch A->submat_singleis = flg; 1352d71ae5a4SJacob Faibussowitsch break; 
1353071fcb05SBarry Smith case MAT_SORTED_FULL: 1354071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1355071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1356071fcb05SBarry Smith break; 1357d71ae5a4SJacob Faibussowitsch case MAT_FORM_EXPLICIT_TRANSPOSE: 1358d71ae5a4SJacob Faibussowitsch A->form_explicit_transpose = flg; 1359d71ae5a4SJacob Faibussowitsch break; 1360d71ae5a4SJacob Faibussowitsch default: 1361d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 1362a65d3064SKris Buschelman } 13633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 136417ab2063SBarry Smith } 136517ab2063SBarry Smith 1366ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v) 1367d71ae5a4SJacob Faibussowitsch { 1368416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1369fdc842d1SBarry Smith PetscInt i, j, n, *ai = a->i, *aj = a->j; 1370c898d852SStefano Zampini PetscScalar *x; 1371c898d852SStefano Zampini const PetscScalar *aa; 137217ab2063SBarry Smith 13733a40ed3dSBarry Smith PetscFunctionBegin; 13749566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 137508401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 13769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 1377d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1378d3e70bfaSHong Zhang PetscInt *diag = a->diag; 13799566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 13802c990fa1SHong Zhang for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]]; 13819566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 138435e7444dSHong Zhang } 138535e7444dSHong Zhang 13869566063dSJacob 
Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 138735e7444dSHong Zhang for (i = 0; i < n; i++) { 1388fdc842d1SBarry Smith x[i] = 0.0; 138935e7444dSHong Zhang for (j = ai[i]; j < ai[i + 1]; j++) { 139035e7444dSHong Zhang if (aj[j] == i) { 139135e7444dSHong Zhang x[i] = aa[j]; 139217ab2063SBarry Smith break; 139317ab2063SBarry Smith } 139417ab2063SBarry Smith } 139517ab2063SBarry Smith } 13969566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 13979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 13983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 139917ab2063SBarry Smith } 140017ab2063SBarry Smith 1401c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy) 1403d71ae5a4SJacob Faibussowitsch { 1404416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 14055f22a7b3SSebastian Grimberg const MatScalar *aa; 1406d9ca1df4SBarry Smith PetscScalar *y; 1407d9ca1df4SBarry Smith const PetscScalar *x; 1408d0f46423SBarry Smith PetscInt m = A->rmap->n; 14095c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14105f22a7b3SSebastian Grimberg const MatScalar *v; 1411a77337e4SBarry Smith PetscScalar alpha; 1412d9ca1df4SBarry Smith PetscInt n, i, j; 1413d9ca1df4SBarry Smith const PetscInt *idx, *ii, *ridx = NULL; 14143447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1415ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14165c897100SBarry Smith #endif 141717ab2063SBarry Smith 14183a40ed3dSBarry Smith PetscFunctionBegin; 14199566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz, yy)); 14209566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14219566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 14229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 14235c897100SBarry Smith 14245c897100SBarry Smith #if 
defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1425fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y); 14265c897100SBarry Smith #else 14273447b6efSHong Zhang if (usecprow) { 14283447b6efSHong Zhang m = cprow.nrows; 14293447b6efSHong Zhang ii = cprow.i; 14307b2bb3b9SHong Zhang ridx = cprow.rindex; 14313447b6efSHong Zhang } else { 14323447b6efSHong Zhang ii = a->i; 14333447b6efSHong Zhang } 143417ab2063SBarry Smith for (i = 0; i < m; i++) { 14353447b6efSHong Zhang idx = a->j + ii[i]; 1436fff043a9SJunchao Zhang v = aa + ii[i]; 14373447b6efSHong Zhang n = ii[i + 1] - ii[i]; 14383447b6efSHong Zhang if (usecprow) { 14397b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14403447b6efSHong Zhang } else { 144117ab2063SBarry Smith alpha = x[i]; 14423447b6efSHong Zhang } 144304fbf559SBarry Smith for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j]; 144417ab2063SBarry Smith } 14455c897100SBarry Smith #endif 14469566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 14479566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 14489566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 14499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 14503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 145117ab2063SBarry Smith } 145217ab2063SBarry Smith 1453d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy) 1454d71ae5a4SJacob Faibussowitsch { 14555c897100SBarry Smith PetscFunctionBegin; 14569566063dSJacob Faibussowitsch PetscCall(VecSet(yy, 0.0)); 14579566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy)); 14583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14595c897100SBarry Smith } 14605c897100SBarry Smith 1461c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 146278b84d54SShri Abhyankar 1463d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy) 
1464d71ae5a4SJacob Faibussowitsch { 1465416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1466d9fead3dSBarry Smith PetscScalar *y; 146754f21887SBarry Smith const PetscScalar *x; 1468fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1469003131ecSBarry Smith PetscInt m = A->rmap->n; 14700298fd71SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 14717b083b7cSBarry Smith PetscInt n, i; 1472362ced78SSatish Balay PetscScalar sum; 1473ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 147417ab2063SBarry Smith 1475b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 147697952fefSHong Zhang #pragma disjoint(*x, *y, *aa) 1477fee21e36SBarry Smith #endif 1478fee21e36SBarry Smith 14793a40ed3dSBarry Smith PetscFunctionBegin; 1480b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14819566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy)); 14823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1483b215bc84SStefano Zampini } 14849566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 14859566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 14869566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1487416022c9SBarry Smith ii = a->i; 14884eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14899566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y, m)); 149097952fefSHong Zhang m = a->compressedrow.nrows; 149197952fefSHong Zhang ii = a->compressedrow.i; 149297952fefSHong Zhang ridx = a->compressedrow.rindex; 149397952fefSHong Zhang for (i = 0; i < m; i++) { 149497952fefSHong Zhang n = ii[i + 1] - ii[i]; 149597952fefSHong Zhang aj = a->j + ii[i]; 1496fff043a9SJunchao Zhang aa = a_a + ii[i]; 149797952fefSHong Zhang sum = 0.0; 1498003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 1499003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 150097952fefSHong Zhang y[*ridx++] = sum; 150197952fefSHong Zhang } 150297952fefSHong 
Zhang } else { /* do not use compressed row format */ 1503b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15043d3eaba7SBarry Smith aj = a->j; 1505fff043a9SJunchao Zhang aa = a_a; 1506b05257ddSBarry Smith fortranmultaij_(&m, x, ii, aj, aa, y); 1507b05257ddSBarry Smith #else 150817ab2063SBarry Smith for (i = 0; i < m; i++) { 1509003131ecSBarry Smith n = ii[i + 1] - ii[i]; 1510003131ecSBarry Smith aj = a->j + ii[i]; 1511fff043a9SJunchao Zhang aa = a_a + ii[i]; 151217ab2063SBarry Smith sum = 0.0; 1513003131ecSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 151417ab2063SBarry Smith y[i] = sum; 151517ab2063SBarry Smith } 15168d195f9aSBarry Smith #endif 1517b05257ddSBarry Smith } 15189566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt)); 15199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15209566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 152317ab2063SBarry Smith } 152417ab2063SBarry Smith 1525ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1526ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy) 1527d71ae5a4SJacob Faibussowitsch { 1528b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1529b434eb95SMatthew G. Knepley PetscScalar *y; 1530b434eb95SMatthew G. Knepley const PetscScalar *x; 1531fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1532b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n; 1533b434eb95SMatthew G. Knepley const PetscInt *aj, *ii, *ridx = NULL; 1534b434eb95SMatthew G. Knepley PetscInt n, i, nonzerorow = 0; 1535b434eb95SMatthew G. Knepley PetscScalar sum; 1536b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1537b434eb95SMatthew G. Knepley 1538b434eb95SMatthew G. 
Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1539b434eb95SMatthew G. Knepley #pragma disjoint(*x, *y, *aa) 1540b434eb95SMatthew G. Knepley #endif 1541b434eb95SMatthew G. Knepley 1542b434eb95SMatthew G. Knepley PetscFunctionBegin; 15439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15449566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15459566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy, &y)); 1546b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1547b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1548b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1549b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1550b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1551b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1552b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1553fff043a9SJunchao Zhang aa = a_a + ii[i]; 1554b434eb95SMatthew G. Knepley sum = 0.0; 1555b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1556b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1557b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1558b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1559b434eb95SMatthew G. Knepley } 1560b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 15613d3eaba7SBarry Smith ii = a->i; 1562b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1563b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1564b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1565fff043a9SJunchao Zhang aa = a_a + ii[i]; 1566b434eb95SMatthew G. Knepley sum = 0.0; 1567b434eb95SMatthew G. Knepley nonzerorow += (n > 0); 1568b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1569b434eb95SMatthew G. Knepley y[i] = sum; 1570b434eb95SMatthew G. Knepley } 1571b434eb95SMatthew G. 
Knepley } 15729566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow)); 15739566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 15749566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy, &y)); 15759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 15763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1577b434eb95SMatthew G. Knepley } 1578b434eb95SMatthew G. Knepley 1579ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c 1580ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1581d71ae5a4SJacob Faibussowitsch { 1582b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1583b434eb95SMatthew G. Knepley PetscScalar *y, *z; 1584b434eb95SMatthew G. Knepley const PetscScalar *x; 1585fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1586b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n, *aj, *ii; 1587b434eb95SMatthew G. Knepley PetscInt n, i, *ridx = NULL; 1588b434eb95SMatthew G. Knepley PetscScalar sum; 1589b434eb95SMatthew G. Knepley PetscBool usecprow = a->compressedrow.use; 1590b434eb95SMatthew G. Knepley 1591b434eb95SMatthew G. Knepley PetscFunctionBegin; 15929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 15939566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 15949566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 1595b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 159648a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 1597b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1598b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1599b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1600b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1601b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1602b434eb95SMatthew G. 
Knepley aj = a->j + ii[i]; 1603fff043a9SJunchao Zhang aa = a_a + ii[i]; 1604b434eb95SMatthew G. Knepley sum = y[*ridx]; 1605b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1606b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1607b434eb95SMatthew G. Knepley } 1608b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16093d3eaba7SBarry Smith ii = a->i; 1610b434eb95SMatthew G. Knepley for (i = 0; i < m; i++) { 1611b434eb95SMatthew G. Knepley n = ii[i + 1] - ii[i]; 1612b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1613fff043a9SJunchao Zhang aa = a_a + ii[i]; 1614b434eb95SMatthew G. Knepley sum = y[i]; 1615b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum, x, aa, aj, n); 1616b434eb95SMatthew G. Knepley z[i] = sum; 1617b434eb95SMatthew G. Knepley } 1618b434eb95SMatthew G. Knepley } 16199566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16209566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16219566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1624b434eb95SMatthew G. Knepley } 1625b434eb95SMatthew G. 
Knepley 1626c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1627d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz) 1628d71ae5a4SJacob Faibussowitsch { 1629416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1630f15663dcSBarry Smith PetscScalar *y, *z; 1631f15663dcSBarry Smith const PetscScalar *x; 1632fff043a9SJunchao Zhang const MatScalar *aa, *a_a; 1633d9ca1df4SBarry Smith const PetscInt *aj, *ii, *ridx = NULL; 1634d9ca1df4SBarry Smith PetscInt m = A->rmap->n, n, i; 1635362ced78SSatish Balay PetscScalar sum; 1636ace3abfcSBarry Smith PetscBool usecprow = a->compressedrow.use; 16379ea0dfa2SSatish Balay 16383a40ed3dSBarry Smith PetscFunctionBegin; 1639b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16409566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz)); 16413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1642b215bc84SStefano Zampini } 16439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &a_a)); 16449566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx, &x)); 16459566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy, zz, &y, &z)); 16464eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 164748a46eb9SPierre Jolivet if (zz != yy) PetscCall(PetscArraycpy(z, y, m)); 164897952fefSHong Zhang m = a->compressedrow.nrows; 164997952fefSHong Zhang ii = a->compressedrow.i; 165097952fefSHong Zhang ridx = a->compressedrow.rindex; 165197952fefSHong Zhang for (i = 0; i < m; i++) { 165297952fefSHong Zhang n = ii[i + 1] - ii[i]; 165397952fefSHong Zhang aj = a->j + ii[i]; 1654fff043a9SJunchao Zhang aa = a_a + ii[i]; 165597952fefSHong Zhang sum = y[*ridx]; 1656f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 165797952fefSHong Zhang z[*ridx++] = sum; 165897952fefSHong Zhang } 165997952fefSHong Zhang } else { /* do not use compressed row format */ 16603d3eaba7SBarry Smith ii = a->i; 
1661f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16623d3eaba7SBarry Smith aj = a->j; 1663fff043a9SJunchao Zhang aa = a_a; 1664f15663dcSBarry Smith fortranmultaddaij_(&m, x, ii, aj, aa, y, z); 1665f15663dcSBarry Smith #else 166617ab2063SBarry Smith for (i = 0; i < m; i++) { 1667f15663dcSBarry Smith n = ii[i + 1] - ii[i]; 1668f15663dcSBarry Smith aj = a->j + ii[i]; 1669fff043a9SJunchao Zhang aa = a_a + ii[i]; 167017ab2063SBarry Smith sum = y[i]; 1671f15663dcSBarry Smith PetscSparseDensePlusDot(sum, x, aa, aj, n); 167217ab2063SBarry Smith z[i] = sum; 167317ab2063SBarry Smith } 167402ab625aSSatish Balay #endif 1675f15663dcSBarry Smith } 16769566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 16779566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx, &x)); 16789566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy, zz, &y, &z)); 16799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a)); 16803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 168117ab2063SBarry Smith } 168217ab2063SBarry Smith 168317ab2063SBarry Smith /* 168417ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
168517ab2063SBarry Smith */ 1686d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 1687d71ae5a4SJacob Faibussowitsch { 1688416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1689d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n; 1690c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 169117ab2063SBarry Smith 16923a40ed3dSBarry Smith PetscFunctionBegin; 169309f38230SBarry Smith if (!a->diag) { 16949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &a->diag)); 1695c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 169609f38230SBarry Smith } 1697d0f46423SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1698c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1699c0c07093SJunchao Zhang if (alreadySet) { 1700c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1701c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue; 1702c0c07093SJunchao Zhang } 1703c0c07093SJunchao Zhang 170409f38230SBarry Smith a->diag[i] = a->i[i + 1]; 1705bfeeae90SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 1706bfeeae90SHong Zhang if (a->j[j] == i) { 170709f38230SBarry Smith a->diag[i] = j; 170817ab2063SBarry Smith break; 170917ab2063SBarry Smith } 171017ab2063SBarry Smith } 171117ab2063SBarry Smith } 17123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 171317ab2063SBarry Smith } 171417ab2063SBarry Smith 1715ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v) 1716d71ae5a4SJacob Faibussowitsch { 171761ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 171861ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt *)a->diag; 171961ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt *)a->i; 172061ecd0c6SBarry Smith PetscInt i, *mdiag = NULL; 172161ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 172261ecd0c6SBarry Smith 172361ecd0c6SBarry 
Smith PetscFunctionBegin; 172461ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL)); 17269566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 17273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 172861ecd0c6SBarry Smith } 172961ecd0c6SBarry Smith 173061ecd0c6SBarry Smith if (a->diagonaldense) { 173161ecd0c6SBarry Smith cnt = 0; 173261ecd0c6SBarry Smith } else { 17339566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &mdiag)); 173461ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 1735349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */ 173661ecd0c6SBarry Smith cnt++; 173761ecd0c6SBarry Smith mdiag[i] = 1; 173861ecd0c6SBarry Smith } 173961ecd0c6SBarry Smith } 174061ecd0c6SBarry Smith } 174161ecd0c6SBarry Smith if (!cnt) { 17429566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A, v)); 174361ecd0c6SBarry Smith } else { 1744b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1745b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 174661ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij; 17476ea2a7edSJunchao Zhang const PetscScalar *Aa; 17486ea2a7edSJunchao Zhang 17496ea2a7edSJunchao Zhang PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host 17506ea2a7edSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa)); 175161ecd0c6SBarry Smith 175261ecd0c6SBarry Smith a->a = NULL; 175361ecd0c6SBarry Smith a->j = NULL; 175461ecd0c6SBarry Smith a->i = NULL; 175561ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1756ad540459SPierre Jolivet for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i]; 17579566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax)); 175861ecd0c6SBarry Smith 175961ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 176061ecd0c6SBarry Smith for (i = 0; i < A->rmap->n; i++) { 17619566063dSJacob Faibussowitsch PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES)); 176248a46eb9SPierre Jolivet if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES)); 1763447d62f5SStefano Zampini } 17649566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 17659566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 176661ecd0c6SBarry Smith if (singlemalloc) { 17679566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda, oldj, oldi)); 176861ecd0c6SBarry Smith } else { 17699566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17709566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17719566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 177261ecd0c6SBarry Smith } 177361ecd0c6SBarry Smith } 17749566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 177561ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 17763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 177761ecd0c6SBarry Smith } 177861ecd0c6SBarry Smith 1779be5855fcSBarry Smith /* 1780be5855fcSBarry Smith Checks for missing diagonals 1781be5855fcSBarry Smith */ 1782d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d) 1783d71ae5a4SJacob Faibussowitsch { 1784be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 17857734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 1786be5855fcSBarry Smith 1787be5855fcSBarry Smith PetscFunctionBegin; 178809f38230SBarry Smith *missing = PETSC_FALSE; 17897734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 179009f38230SBarry Smith *missing = PETSC_TRUE; 179109f38230SBarry Smith if (d) *d = 0; 17929566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 179309f38230SBarry Smith } else { 179401445905SHong Zhang PetscInt n; 179501445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1796f1e2ffcdSBarry Smith diag = a->diag; 179701445905SHong Zhang for (i = 0; i < n; i++) { 17987734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 179909f38230SBarry Smith *missing = PETSC_TRUE; 180009f38230SBarry Smith if (d) *d = i; 18019566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i)); 1802358d2f5dSShri Abhyankar break; 180309f38230SBarry Smith } 1804be5855fcSBarry Smith } 1805be5855fcSBarry Smith } 18063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1807be5855fcSBarry Smith } 1808be5855fcSBarry Smith 18090da83c2eSBarry Smith #include <petscblaslapack.h> 18100da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18110da83c2eSBarry Smith 18120da83c2eSBarry Smith /* 18130da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18140da83c2eSBarry Smith */ 1815ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag) 1816d71ae5a4SJacob Faibussowitsch { 18170da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots; 18180da83c2eSBarry Smith PetscBool allowzeropivot, zeropivotdetected = PETSC_FALSE; 18190da83c2eSBarry Smith const PetscReal shift = 0.0; 18200da83c2eSBarry Smith PetscInt ipvt[5]; 18214e208921SJed Brown PetscCount flops = 0; 18220da83c2eSBarry Smith PetscScalar work[25], *v_work; 18230da83c2eSBarry Smith 18240da83c2eSBarry Smith PetscFunctionBegin; 18250da83c2eSBarry Smith allowzeropivot = 
PetscNot(A->erroriffailure); 18260da83c2eSBarry Smith for (i = 0; i < nblocks; i++) ncnt += bsizes[i]; 182708401ef6SPierre Jolivet PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n); 1828ad540459SPierre Jolivet for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]); 18299566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax, &indx)); 183048a46eb9SPierre Jolivet if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots)); 18310da83c2eSBarry Smith ncnt = 0; 18320da83c2eSBarry Smith for (i = 0; i < nblocks; i++) { 18330da83c2eSBarry Smith for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j; 18349566063dSJacob Faibussowitsch PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag)); 18350da83c2eSBarry Smith switch (bsizes[i]) { 1836d71ae5a4SJacob Faibussowitsch case 1: 1837d71ae5a4SJacob Faibussowitsch *diag = 1.0 / (*diag); 1838d71ae5a4SJacob Faibussowitsch break; 18390da83c2eSBarry Smith case 2: 18409566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected)); 18410da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18429566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18430da83c2eSBarry Smith break; 18440da83c2eSBarry Smith case 3: 18459566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected)); 18460da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18479566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18480da83c2eSBarry Smith break; 18490da83c2eSBarry Smith case 4: 18509566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected)); 18510da83c2eSBarry Smith if (zeropivotdetected) 
A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18529566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18530da83c2eSBarry Smith break; 18540da83c2eSBarry Smith case 5: 18559566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected)); 18560da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18579566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18580da83c2eSBarry Smith break; 18590da83c2eSBarry Smith case 6: 18609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected)); 18610da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18630da83c2eSBarry Smith break; 18640da83c2eSBarry Smith case 7: 18659566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected)); 18660da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18679566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18680da83c2eSBarry Smith break; 18690da83c2eSBarry Smith default: 18709566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected)); 18710da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18729566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i])); 18730da83c2eSBarry Smith } 18740da83c2eSBarry Smith ncnt += bsizes[i]; 18750da83c2eSBarry Smith diag += bsizes[i] * bsizes[i]; 18764e208921SJed Brown flops += 2 * PetscPowInt(bsizes[i], 3) / 3; 18770da83c2eSBarry Smith } 18783ba16761SJacob Faibussowitsch PetscCall(PetscLogFlops(flops)); 187948a46eb9SPierre Jolivet if 
(bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots)); 18809566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18820da83c2eSBarry Smith } 18830da83c2eSBarry Smith 1884422a814eSBarry Smith /* 1885422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1886422a814eSBarry Smith */ 1887ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift) 1888d71ae5a4SJacob Faibussowitsch { 188971f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1890d0f46423SBarry Smith PetscInt i, *diag, m = A->rmap->n; 18912e5835c6SStefano Zampini const MatScalar *v; 189254f21887SBarry Smith PetscScalar *idiag, *mdiag; 189371f1c65dSBarry Smith 189471f1c65dSBarry Smith PetscFunctionBegin; 18953ba16761SJacob Faibussowitsch if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS); 18969566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 189771f1c65dSBarry Smith diag = a->diag; 18984dfa11a4SJacob Faibussowitsch if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); } 18992e5835c6SStefano Zampini 190071f1c65dSBarry Smith mdiag = a->mdiag; 190171f1c65dSBarry Smith idiag = a->idiag; 19029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 1903422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 190471f1c65dSBarry Smith for (i = 0; i < m; i++) { 190571f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1906899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1907899639b0SHong Zhang if (PetscRealPart(fshift)) { 19089566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i)); 19097b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19107b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19117b6c816cSBarry Smith 
A->factorerror_zeropivot_row = i; 191298921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i); 1913899639b0SHong Zhang } 191471f1c65dSBarry Smith idiag[i] = 1.0 / v[diag[i]]; 191571f1c65dSBarry Smith } 19169566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 191771f1c65dSBarry Smith } else { 191871f1c65dSBarry Smith for (i = 0; i < m; i++) { 191971f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 192071f1c65dSBarry Smith idiag[i] = omega / (fshift + v[diag[i]]); 192171f1c65dSBarry Smith } 19229566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * m)); 192371f1c65dSBarry Smith } 192471f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 19263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 192771f1c65dSBarry Smith } 192871f1c65dSBarry Smith 1929c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 1930d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx) 1931d71ae5a4SJacob Faibussowitsch { 1932416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 1933e6d1f457SBarry Smith PetscScalar *x, d, sum, *t, scale; 19342e5835c6SStefano Zampini const MatScalar *v, *idiag = NULL, *mdiag, *aa; 193554f21887SBarry Smith const PetscScalar *b, *bs, *xb, *ts; 19363d3eaba7SBarry Smith PetscInt n, m = A->rmap->n, i; 193797f1f81fSBarry Smith const PetscInt *idx, *diag; 193817ab2063SBarry Smith 19393a40ed3dSBarry Smith PetscFunctionBegin; 1940b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19419566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx)); 19423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1943b215bc84SStefano Zampini } 1944b965ef7fSBarry Smith its = its * lits; 
194591723122SBarry Smith 194671f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19479566063dSJacob Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift)); 194871f1c65dSBarry Smith a->fshift = fshift; 194971f1c65dSBarry Smith a->omega = omega; 1950ed480e8bSBarry Smith 195171f1c65dSBarry Smith diag = a->diag; 195271f1c65dSBarry Smith t = a->ssor_work; 1953ed480e8bSBarry Smith idiag = a->idiag; 195471f1c65dSBarry Smith mdiag = a->mdiag; 1955ed480e8bSBarry Smith 19569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 19579566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx, &x)); 19589566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb, &b)); 1959ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 196017ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 196117ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1962ed480e8bSBarry Smith bs = b; 196317ab2063SBarry Smith for (i = 0; i < m; i++) { 196471f1c65dSBarry Smith d = fshift + mdiag[i]; 1965416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1966ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19672e5835c6SStefano Zampini v = aa + diag[i] + 1; 196817ab2063SBarry Smith sum = b[i] * d / omega; 1969003131ecSBarry Smith PetscSparseDensePlusDot(sum, bs, v, idx, n); 197017ab2063SBarry Smith x[i] = sum; 197117ab2063SBarry Smith } 19729566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 19739566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 19749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 19759566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 197717ab2063SBarry Smith } 1978c783ea89SBarry Smith 197908401ef6SPierre Jolivet PetscCheck(flag != SOR_APPLY_LOWER, 
PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented"); 1980f7d195e4SLawrence Mitchell if (flag & SOR_EISENSTAT) { 19814c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1982887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 198317ab2063SBarry Smith 198417ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 198517ab2063SBarry Smith 1986887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 198717ab2063SBarry Smith */ 198817ab2063SBarry Smith scale = (2.0 / omega) - 1.0; 198917ab2063SBarry Smith 199017ab2063SBarry Smith /* x = (E + U)^{-1} b */ 199117ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 1992416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 1993ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19942e5835c6SStefano Zampini v = aa + diag[i] + 1; 199517ab2063SBarry Smith sum = b[i]; 1996e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 1997ed480e8bSBarry Smith x[i] = sum * idiag[i]; 199817ab2063SBarry Smith } 199917ab2063SBarry Smith 200017ab2063SBarry Smith /* t = b - (2*E - D)x */ 20012e5835c6SStefano Zampini v = aa; 20022205254eSKarl Rupp for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i]; 200317ab2063SBarry Smith 200417ab2063SBarry Smith /* t = (E + L)^{-1}t */ 2005ed480e8bSBarry Smith ts = t; 2006416022c9SBarry Smith diag = a->diag; 200717ab2063SBarry Smith for (i = 0; i < m; i++) { 2008416022c9SBarry Smith n = diag[i] - a->i[i]; 2009ed480e8bSBarry Smith idx = a->j + a->i[i]; 20102e5835c6SStefano Zampini v = aa + a->i[i]; 201117ab2063SBarry Smith sum = t[i]; 2012003131ecSBarry Smith PetscSparseDenseMinusDot(sum, ts, v, idx, n); 2013ed480e8bSBarry Smith t[i] = sum * idiag[i]; 2014733d66baSBarry Smith /* x = x + t */ 2015733d66baSBarry Smith x[i] += t[i]; 201617ab2063SBarry Smith } 201717ab2063SBarry Smith 20189566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz)); 20199566063dSJacob Faibussowitsch 
PetscCall(VecRestoreArray(xx, &x)); 20209566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 20213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 202217ab2063SBarry Smith } 202317ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 202417ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 202517ab2063SBarry Smith for (i = 0; i < m; i++) { 2026416022c9SBarry Smith n = diag[i] - a->i[i]; 2027ed480e8bSBarry Smith idx = a->j + a->i[i]; 20282e5835c6SStefano Zampini v = aa + a->i[i]; 202917ab2063SBarry Smith sum = b[i]; 2030e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20315c99c7daSBarry Smith t[i] = sum; 2032ed480e8bSBarry Smith x[i] = sum * idiag[i]; 203317ab2063SBarry Smith } 20345c99c7daSBarry Smith xb = t; 20359566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20363a40ed3dSBarry Smith } else xb = b; 203717ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 203817ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2039416022c9SBarry Smith n = a->i[i + 1] - diag[i] - 1; 2040ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20412e5835c6SStefano Zampini v = aa + diag[i] + 1; 204217ab2063SBarry Smith sum = xb[i]; 2043e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 20445c99c7daSBarry Smith if (xb == b) { 2045ed480e8bSBarry Smith x[i] = sum * idiag[i]; 20465c99c7daSBarry Smith } else { 2047b19a5dc2SMark Adams x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 204817ab2063SBarry Smith } 20495c99c7daSBarry Smith } 20509566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 205117ab2063SBarry Smith } 205217ab2063SBarry Smith its--; 205317ab2063SBarry Smith } 205417ab2063SBarry Smith while (its--) { 205517ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 205617ab2063SBarry Smith for (i = 0; i < m; i++) { 2057b19a5dc2SMark Adams /* lower */ 
2058b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2059ed480e8bSBarry Smith idx = a->j + a->i[i]; 20602e5835c6SStefano Zampini v = aa + a->i[i]; 206117ab2063SBarry Smith sum = b[i]; 2062e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2063b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 2064b19a5dc2SMark Adams /* upper */ 2065b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2066b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20672e5835c6SStefano Zampini v = aa + diag[i] + 1; 2068b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2069b19a5dc2SMark Adams x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 207017ab2063SBarry Smith } 2071b19a5dc2SMark Adams xb = t; 20729566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2073b19a5dc2SMark Adams } else xb = b; 207417ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 207517ab2063SBarry Smith for (i = m - 1; i >= 0; i--) { 2076b19a5dc2SMark Adams sum = xb[i]; 2077b19a5dc2SMark Adams if (xb == b) { 2078b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2079416022c9SBarry Smith n = a->i[i + 1] - a->i[i]; 2080ed480e8bSBarry Smith idx = a->j + a->i[i]; 20812e5835c6SStefano Zampini v = aa + a->i[i]; 2082e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum, x, v, idx, n); 2083ed480e8bSBarry Smith x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i]; 2084b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2085b19a5dc2SMark Adams n = a->i[i + 1] - diag[i] - 1; 2086b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20872e5835c6SStefano Zampini v = aa + diag[i] + 1; 2088b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum, x, v, idx, n); 2089b19a5dc2SMark Adams x[i] = (1. 
- omega) * x[i] + sum * idiag[i]; /* omega in idiag */ 209017ab2063SBarry Smith } 2091b19a5dc2SMark Adams } 2092b19a5dc2SMark Adams if (xb == b) { 20939566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 2094b19a5dc2SMark Adams } else { 20959566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2096b19a5dc2SMark Adams } 209717ab2063SBarry Smith } 209817ab2063SBarry Smith } 20999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 21009566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx, &x)); 21019566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb, &b)); 21023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 210317ab2063SBarry Smith } 210417ab2063SBarry Smith 2105ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info) 2106d71ae5a4SJacob Faibussowitsch { 2107416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21084e220ebcSLois Curfman McInnes 21093a40ed3dSBarry Smith PetscFunctionBegin; 21104e220ebcSLois Curfman McInnes info->block_size = 1.0; 21113966268fSBarry Smith info->nz_allocated = a->maxnz; 21123966268fSBarry Smith info->nz_used = a->nz; 21133966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21143966268fSBarry Smith info->assemblies = A->num_ass; 21153966268fSBarry Smith info->mallocs = A->info.mallocs; 21164dfa11a4SJacob Faibussowitsch info->memory = 0; /* REVIEW ME */ 2117d5f3da31SBarry Smith if (A->factortype) { 21184e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21194e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21204e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21214e220ebcSLois Curfman McInnes } else { 21224e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21234e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21244e220ebcSLois Curfman McInnes info->factor_mallocs = 
0; 21254e220ebcSLois Curfman McInnes } 21263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 212717ab2063SBarry Smith } 212817ab2063SBarry Smith 2129ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2130d71ae5a4SJacob Faibussowitsch { 2131416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2132c7da8527SEric Chamberland PetscInt i, m = A->rmap->n - 1; 213397b48c8fSBarry Smith const PetscScalar *xx; 21342e5835c6SStefano Zampini PetscScalar *bb, *aa; 2135c7da8527SEric Chamberland PetscInt d = 0; 213617ab2063SBarry Smith 21373a40ed3dSBarry Smith PetscFunctionBegin; 213897b48c8fSBarry Smith if (x && b) { 21399566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 21409566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 214197b48c8fSBarry Smith for (i = 0; i < N; i++) { 2142aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2143447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 214497b48c8fSBarry Smith bb[rows[i]] = diag * xx[rows[i]]; 214597b48c8fSBarry Smith } 21469566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 21479566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 214897b48c8fSBarry Smith } 214997b48c8fSBarry Smith 21509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 2151a9817697SBarry Smith if (a->keepnonzeropattern) { 2152f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2153aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21549566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]])); 2155f1e2ffcdSBarry Smith } 2156f4df32b1SMatthew Knepley if (diag != 0.0) { 2157c7da8527SEric Chamberland for (i = 0; i < N; i++) { 2158c7da8527SEric 
Chamberland d = rows[i]; 2159447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 216008401ef6SPierre Jolivet PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d); 2161c7da8527SEric Chamberland } 2162f1e2ffcdSBarry Smith for (i = 0; i < N; i++) { 2163447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21642e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2165f1e2ffcdSBarry Smith } 2166f1e2ffcdSBarry Smith } 2167f1e2ffcdSBarry Smith } else { 2168f4df32b1SMatthew Knepley if (diag != 0.0) { 216917ab2063SBarry Smith for (i = 0; i < N; i++) { 2170aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 21717ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2172447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2173447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2174447d62f5SStefano Zampini } else { 2175416022c9SBarry Smith a->ilen[rows[i]] = 1; 21762e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2177bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2178447d62f5SStefano Zampini } 2179447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21809566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 218117ab2063SBarry Smith } 218217ab2063SBarry Smith } 21833a40ed3dSBarry Smith } else { 218417ab2063SBarry Smith for (i = 0; i < N; i++) { 2185aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2186416022c9SBarry Smith a->ilen[rows[i]] = 0; 218717ab2063SBarry Smith } 218817ab2063SBarry Smith } 2189e56f5c9eSBarry Smith A->nonzerostate++; 2190f1e2ffcdSBarry Smith } 21919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2192dbbe0bcdSBarry Smith 
PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 21933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 219417ab2063SBarry Smith } 219517ab2063SBarry Smith 2196ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b) 2197d71ae5a4SJacob Faibussowitsch { 21986e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 21996e169961SBarry Smith PetscInt i, j, m = A->rmap->n - 1, d = 0; 22002b40b63fSBarry Smith PetscBool missing, *zeroed, vecs = PETSC_FALSE; 22016e169961SBarry Smith const PetscScalar *xx; 22022e5835c6SStefano Zampini PetscScalar *bb, *aa; 22036e169961SBarry Smith 22046e169961SBarry Smith PetscFunctionBegin; 22053ba16761SJacob Faibussowitsch if (!N) PetscFunctionReturn(PETSC_SUCCESS); 22069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &aa)); 22076e169961SBarry Smith if (x && b) { 22089566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 22099566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 22102b40b63fSBarry Smith vecs = PETSC_TRUE; 22116e169961SBarry Smith } 22129566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 22136e169961SBarry Smith for (i = 0; i < N; i++) { 2214aed4548fSBarry Smith PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]); 2215*8e3a54c0SPierre Jolivet PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]])); 22162205254eSKarl Rupp 22176e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22186e169961SBarry Smith } 22196e169961SBarry Smith for (i = 0; i < A->rmap->n; i++) { 22206e169961SBarry Smith if (!zeroed[i]) { 22216e169961SBarry Smith for (j = a->i[i]; j < a->i[i + 1]; j++) { 22224cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22232e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j] * xx[a->j[j]]; 22242e5835c6SStefano Zampini 
aa[j] = 0.0; 22256e169961SBarry Smith } 22266e169961SBarry Smith } 22274cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i]; 22286e169961SBarry Smith } 22296e169961SBarry Smith if (x && b) { 22309566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 22319566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 22326e169961SBarry Smith } 22339566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22346e169961SBarry Smith if (diag != 0.0) { 22359566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d)); 22361d5a398dSstefano_zampini if (missing) { 22371d5a398dSstefano_zampini for (i = 0; i < N; i++) { 22384cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 2239aed4548fSBarry Smith PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]); 22409566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES)); 22411d5a398dSstefano_zampini } 22421d5a398dSstefano_zampini } else { 2243ad540459SPierre Jolivet for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag; 22446e169961SBarry Smith } 22451d5a398dSstefano_zampini } 22469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &aa)); 2247dbbe0bcdSBarry Smith PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY); 22483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22496e169961SBarry Smith } 22506e169961SBarry Smith 2251d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2252d71ae5a4SJacob Faibussowitsch { 2253fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2254fff043a9SJunchao Zhang const PetscScalar *aa; 225517ab2063SBarry Smith 22563a40ed3dSBarry Smith PetscFunctionBegin; 22579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 
2258416022c9SBarry Smith *nz = a->i[row + 1] - a->i[row]; 2259*8e3a54c0SPierre Jolivet if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]); 226017ab2063SBarry Smith if (idx) { 22615c0db29aSPierre Jolivet if (*nz && a->j) *idx = a->j + a->i[row]; 2262f4259b30SLisandro Dalcin else *idx = NULL; 226317ab2063SBarry Smith } 22649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 22653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 226617ab2063SBarry Smith } 226717ab2063SBarry Smith 2268d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 2269d71ae5a4SJacob Faibussowitsch { 22703a40ed3dSBarry Smith PetscFunctionBegin; 22713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 227217ab2063SBarry Smith } 227317ab2063SBarry Smith 2274ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm) 2275d71ae5a4SJacob Faibussowitsch { 2276416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 22772e5835c6SStefano Zampini const MatScalar *v; 227836db0b34SBarry Smith PetscReal sum = 0.0; 227997f1f81fSBarry Smith PetscInt i, j; 228017ab2063SBarry Smith 22813a40ed3dSBarry Smith PetscFunctionBegin; 22829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &v)); 228317ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2284570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2285570b7f6dSBarry Smith PetscBLASInt one = 1, nz = a->nz; 2286792fecdfSBarry Smith PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one)); 2287570b7f6dSBarry Smith #else 2288416022c9SBarry Smith for (i = 0; i < a->nz; i++) { 22899371c9d4SSatish Balay sum += PetscRealPart(PetscConj(*v) * (*v)); 22909371c9d4SSatish Balay v++; 229117ab2063SBarry Smith } 22928f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2293570b7f6dSBarry Smith #endif 22949566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * a->nz)); 
22953a40ed3dSBarry Smith } else if (type == NORM_1) { 229636db0b34SBarry Smith PetscReal *tmp; 229797f1f81fSBarry Smith PetscInt *jj = a->j; 22989566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp)); 2299064f8208SBarry Smith *nrm = 0.0; 2300416022c9SBarry Smith for (j = 0; j < a->nz; j++) { 23019371c9d4SSatish Balay tmp[*jj++] += PetscAbsScalar(*v); 23029371c9d4SSatish Balay v++; 230317ab2063SBarry Smith } 2304d0f46423SBarry Smith for (j = 0; j < A->cmap->n; j++) { 2305064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 230617ab2063SBarry Smith } 23079566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23089566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 23093a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2310064f8208SBarry Smith *nrm = 0.0; 2311d0f46423SBarry Smith for (j = 0; j < A->rmap->n; j++) { 2312*8e3a54c0SPierre Jolivet const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]); 231317ab2063SBarry Smith sum = 0.0; 2314416022c9SBarry Smith for (i = 0; i < a->i[j + 1] - a->i[j]; i++) { 23159371c9d4SSatish Balay sum += PetscAbsScalar(*v2); 23169371c9d4SSatish Balay v2++; 231717ab2063SBarry Smith } 2318064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 231917ab2063SBarry Smith } 23209566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0))); 2321f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm"); 23229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &v)); 23233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 232417ab2063SBarry Smith } 232517ab2063SBarry Smith 2326ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2327d71ae5a4SJacob Faibussowitsch { 23283d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 232954f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 
23302e5835c6SStefano Zampini const MatScalar *va, *vb; 233197f1f81fSBarry Smith PetscInt ma, na, mb, nb, i; 2332cd0d46ebSvictorle 2333cd0d46ebSvictorle PetscFunctionBegin; 23349566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23359566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23365485867bSBarry Smith if (ma != nb || na != mb) { 23375485867bSBarry Smith *f = PETSC_FALSE; 23383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23395485867bSBarry Smith } 23409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &va)); 23419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &vb)); 23429371c9d4SSatish Balay aii = aij->i; 23439371c9d4SSatish Balay bii = bij->i; 23449371c9d4SSatish Balay adx = aij->j; 23459371c9d4SSatish Balay bdx = bij->j; 23469566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23479566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 2348cd0d46ebSvictorle for (i = 0; i < ma; i++) aptr[i] = aii[i]; 2349cd0d46ebSvictorle for (i = 0; i < mb; i++) bptr[i] = bii[i]; 2350cd0d46ebSvictorle 2351cd0d46ebSvictorle *f = PETSC_TRUE; 2352cd0d46ebSvictorle for (i = 0; i < ma; i++) { 2353cd0d46ebSvictorle while (aptr[i] < aii[i + 1]) { 235497f1f81fSBarry Smith PetscInt idc, idr; 23555485867bSBarry Smith PetscScalar vc, vr; 2356cd0d46ebSvictorle /* column/row index/value */ 23575485867bSBarry Smith idc = adx[aptr[i]]; 23585485867bSBarry Smith idr = bdx[bptr[idc]]; 23595485867bSBarry Smith vc = va[aptr[i]]; 23605485867bSBarry Smith vr = vb[bptr[idc]]; 23615485867bSBarry Smith if (i != idr || PetscAbsScalar(vc - vr) > tol) { 23625485867bSBarry Smith *f = PETSC_FALSE; 23635485867bSBarry Smith goto done; 2364cd0d46ebSvictorle } else { 23655485867bSBarry Smith aptr[i]++; 23665485867bSBarry Smith if (B || i != idc) bptr[idc]++; 2367cd0d46ebSvictorle } 2368cd0d46ebSvictorle } 2369cd0d46ebSvictorle } 2370cd0d46ebSvictorle done: 23719566063dSJacob Faibussowitsch 
PetscCall(PetscFree(aptr)); 23729566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 23739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &va)); 23749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &vb)); 23753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2376cd0d46ebSvictorle } 2377cd0d46ebSvictorle 2378ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f) 2379d71ae5a4SJacob Faibussowitsch { 23803d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data; 238154f21887SBarry Smith PetscInt *adx, *bdx, *aii, *bii, *aptr, *bptr; 238254f21887SBarry Smith MatScalar *va, *vb; 23831cbb95d3SBarry Smith PetscInt ma, na, mb, nb, i; 23841cbb95d3SBarry Smith 23851cbb95d3SBarry Smith PetscFunctionBegin; 23869566063dSJacob Faibussowitsch PetscCall(MatGetSize(A, &ma, &na)); 23879566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &mb, &nb)); 23881cbb95d3SBarry Smith if (ma != nb || na != mb) { 23891cbb95d3SBarry Smith *f = PETSC_FALSE; 23903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 23911cbb95d3SBarry Smith } 23929371c9d4SSatish Balay aii = aij->i; 23939371c9d4SSatish Balay bii = bij->i; 23949371c9d4SSatish Balay adx = aij->j; 23959371c9d4SSatish Balay bdx = bij->j; 23969371c9d4SSatish Balay va = aij->a; 23979371c9d4SSatish Balay vb = bij->a; 23989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma, &aptr)); 23999566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb, &bptr)); 24001cbb95d3SBarry Smith for (i = 0; i < ma; i++) aptr[i] = aii[i]; 24011cbb95d3SBarry Smith for (i = 0; i < mb; i++) bptr[i] = bii[i]; 24021cbb95d3SBarry Smith 24031cbb95d3SBarry Smith *f = PETSC_TRUE; 24041cbb95d3SBarry Smith for (i = 0; i < ma; i++) { 24051cbb95d3SBarry Smith while (aptr[i] < aii[i + 1]) { 24061cbb95d3SBarry Smith PetscInt idc, idr; 24071cbb95d3SBarry Smith PetscScalar vc, vr; 24081cbb95d3SBarry 
Smith /* column/row index/value */ 24091cbb95d3SBarry Smith idc = adx[aptr[i]]; 24101cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24111cbb95d3SBarry Smith vc = va[aptr[i]]; 24121cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24131cbb95d3SBarry Smith if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) { 24141cbb95d3SBarry Smith *f = PETSC_FALSE; 24151cbb95d3SBarry Smith goto done; 24161cbb95d3SBarry Smith } else { 24171cbb95d3SBarry Smith aptr[i]++; 24181cbb95d3SBarry Smith if (B || i != idc) bptr[idc]++; 24191cbb95d3SBarry Smith } 24201cbb95d3SBarry Smith } 24211cbb95d3SBarry Smith } 24221cbb95d3SBarry Smith done: 24239566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24249566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24261cbb95d3SBarry Smith } 24271cbb95d3SBarry Smith 2428ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2429d71ae5a4SJacob Faibussowitsch { 24309e29f15eSvictorle PetscFunctionBegin; 24319566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f)); 24323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24339e29f15eSvictorle } 24349e29f15eSvictorle 2435ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f) 2436d71ae5a4SJacob Faibussowitsch { 24371cbb95d3SBarry Smith PetscFunctionBegin; 24389566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f)); 24393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 24401cbb95d3SBarry Smith } 24411cbb95d3SBarry Smith 2442d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr) 2443d71ae5a4SJacob Faibussowitsch { 2444416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2445fff8e43fSBarry Smith const PetscScalar *l, *r; 2446fff8e43fSBarry Smith PetscScalar x; 244754f21887SBarry Smith MatScalar *v; 
2448fff8e43fSBarry Smith PetscInt i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz; 2449fff8e43fSBarry Smith const PetscInt *jj; 245017ab2063SBarry Smith 24513a40ed3dSBarry Smith PetscFunctionBegin; 245217ab2063SBarry Smith if (ll) { 24533ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 24543ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 24559566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll, &m)); 245608401ef6SPierre Jolivet PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length"); 24579566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll, &l)); 24589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 245917ab2063SBarry Smith for (i = 0; i < m; i++) { 246017ab2063SBarry Smith x = l[i]; 2461416022c9SBarry Smith M = a->i[i + 1] - a->i[i]; 24622205254eSKarl Rupp for (j = 0; j < M; j++) (*v++) *= x; 246317ab2063SBarry Smith } 24649566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll, &l)); 24659566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 24669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 246717ab2063SBarry Smith } 246817ab2063SBarry Smith if (rr) { 24699566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr, &n)); 247008401ef6SPierre Jolivet PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length"); 24719566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(rr, &r)); 24729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &v)); 24732e5835c6SStefano Zampini jj = a->j; 24742205254eSKarl Rupp for (i = 0; i < nz; i++) (*v++) *= r[*jj++]; 24759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &v)); 24769566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr, &r)); 24779566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 247817ab2063SBarry Smith } 24799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 
24803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 248117ab2063SBarry Smith } 248217ab2063SBarry Smith 2483d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B) 2484d71ae5a4SJacob Faibussowitsch { 2485db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *c; 2486d0f46423SBarry Smith PetscInt *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens; 248797f1f81fSBarry Smith PetscInt row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi; 24885d0c19d7SBarry Smith const PetscInt *irow, *icol; 24892e5835c6SStefano Zampini const PetscScalar *aa; 24905d0c19d7SBarry Smith PetscInt nrows, ncols; 249197f1f81fSBarry Smith PetscInt *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen; 2492fb3c7e2dSJunchao Zhang MatScalar *a_new, *mat_a, *c_a; 2493416022c9SBarry Smith Mat C; 2494cdc6f3adSToby Isaac PetscBool stride; 249517ab2063SBarry Smith 24963a40ed3dSBarry Smith PetscFunctionBegin; 24979566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow, &irow)); 24989566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow, &nrows)); 24999566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol, &ncols)); 250017ab2063SBarry Smith 25019566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride)); 2502ff718158SBarry Smith if (stride) { 25039566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol, &first, &step)); 2504ff718158SBarry Smith } else { 2505ff718158SBarry Smith first = 0; 2506ff718158SBarry Smith step = 0; 2507ff718158SBarry Smith } 2508fee21e36SBarry Smith if (stride && step == 1) { 250902834360SBarry Smith /* special case of contiguous rows */ 25109566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts)); 251102834360SBarry Smith /* loop over new rows determining lens and starting points */ 251202834360SBarry Smith for (i = 0; i < nrows; i++) { 
2513bfeeae90SHong Zhang kstart = ai[irow[i]]; 2514a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2515a91a9bebSLisandro Dalcin starts[i] = kstart; 251602834360SBarry Smith for (k = kstart; k < kend; k++) { 2517bfeeae90SHong Zhang if (aj[k] >= first) { 251802834360SBarry Smith starts[i] = k; 251902834360SBarry Smith break; 252002834360SBarry Smith } 252102834360SBarry Smith } 2522a2744918SBarry Smith sum = 0; 252302834360SBarry Smith while (k < kend) { 2524bfeeae90SHong Zhang if (aj[k++] >= first + ncols) break; 2525a2744918SBarry Smith sum++; 252602834360SBarry Smith } 2527a2744918SBarry Smith lens[i] = sum; 252802834360SBarry Smith } 252902834360SBarry Smith /* create submatrix */ 2530cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 253197f1f81fSBarry Smith PetscInt n_cols, n_rows; 25329566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B, &n_rows, &n_cols)); 2533aed4548fSBarry Smith PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size"); 25349566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 253508480c60SBarry Smith C = *B; 25363a40ed3dSBarry Smith } else { 25373bef6203SJed Brown PetscInt rbs, cbs; 25389566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25399566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25409566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 25419566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 25429566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C, rbs, cbs)); 25439566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 25449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 254508480c60SBarry Smith } 2546db02288aSLois Curfman McInnes c = (Mat_SeqAIJ *)C->data; 2547db02288aSLois Curfman McInnes 254802834360SBarry Smith /* loop over rows inserting into submatrix */ 
2549fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C 2550db02288aSLois Curfman McInnes j_new = c->j; 2551db02288aSLois Curfman McInnes i_new = c->i; 25529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 255302834360SBarry Smith for (i = 0; i < nrows; i++) { 2554a2744918SBarry Smith ii = starts[i]; 2555a2744918SBarry Smith lensi = lens[i]; 2556810441c8SPierre Jolivet if (lensi) { 2557ad540459SPierre Jolivet for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first; 25589566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi)); 2559a2744918SBarry Smith a_new += lensi; 2560810441c8SPierre Jolivet } 2561a2744918SBarry Smith i_new[i + 1] = i_new[i] + lensi; 2562a2744918SBarry Smith c->ilen[i] = lensi; 256302834360SBarry Smith } 2564fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly 25659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 25669566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens, starts)); 25673a40ed3dSBarry Smith } else { 25689566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol, &icol)); 25699566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols, &smap)); 25709566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1 + nrows, &lens)); 25714dcab191SBarry Smith for (i = 0; i < ncols; i++) { 25726bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols); 25734dcab191SBarry Smith smap[icol[i]] = i + 1; 25744dcab191SBarry Smith } 25754dcab191SBarry Smith 257602834360SBarry Smith /* determine lens of each row */ 257702834360SBarry Smith for (i = 0; i < nrows; i++) { 2578bfeeae90SHong Zhang kstart = ai[irow[i]]; 257902834360SBarry Smith kend = kstart + 
a->ilen[irow[i]]; 258002834360SBarry Smith lens[i] = 0; 258102834360SBarry Smith for (k = kstart; k < kend; k++) { 2582ad540459SPierre Jolivet if (smap[aj[k]]) lens[i]++; 258302834360SBarry Smith } 258402834360SBarry Smith } 258517ab2063SBarry Smith /* Create and fill new matrix */ 2586a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2587ace3abfcSBarry Smith PetscBool equal; 25880f5bd95cSBarry Smith 258999141d43SSatish Balay c = (Mat_SeqAIJ *)((*B)->data); 2590aed4548fSBarry Smith PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size"); 25919566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal)); 2592fdfbdca6SPierre Jolivet PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong number of nonzeros"); 25939566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n)); 259408480c60SBarry Smith C = *B; 25953a40ed3dSBarry Smith } else { 25963bef6203SJed Brown PetscInt rbs, cbs; 25979566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 25989566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE)); 25999566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow, &rbs)); 26009566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol, &cbs)); 260137a5e0faSPierre Jolivet if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs)); 26029566063dSJacob Faibussowitsch PetscCall(MatSetType(C, ((PetscObject)A)->type_name)); 26039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens)); 260408480c60SBarry Smith } 26059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 2606fb3c7e2dSJunchao Zhang 260799141d43SSatish Balay c = (Mat_SeqAIJ *)(C->data); 2608fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C 
260917ab2063SBarry Smith for (i = 0; i < nrows; i++) { 261099141d43SSatish Balay row = irow[i]; 2611bfeeae90SHong Zhang kstart = ai[row]; 261299141d43SSatish Balay kend = kstart + a->ilen[row]; 2613bfeeae90SHong Zhang mat_i = c->i[i]; 2614*8e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 2615*8e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 261699141d43SSatish Balay mat_ilen = c->ilen + i; 261717ab2063SBarry Smith for (k = kstart; k < kend; k++) { 2618bfeeae90SHong Zhang if ((tcol = smap[a->j[k]])) { 2619ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26202e5835c6SStefano Zampini *mat_a++ = aa[k]; 262199141d43SSatish Balay (*mat_ilen)++; 262217ab2063SBarry Smith } 262317ab2063SBarry Smith } 262417ab2063SBarry Smith } 26259566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 262602834360SBarry Smith /* Free work space */ 26279566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol, &icol)); 26289566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26299566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 2630cdc6f3adSToby Isaac /* sort */ 2631cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2632cdc6f3adSToby Isaac PetscInt ilen; 2633cdc6f3adSToby Isaac 2634cdc6f3adSToby Isaac mat_i = c->i[i]; 2635*8e3a54c0SPierre Jolivet mat_j = PetscSafePointerPlusOffset(c->j, mat_i); 2636*8e3a54c0SPierre Jolivet mat_a = PetscSafePointerPlusOffset(c_a, mat_i); 2637cdc6f3adSToby Isaac ilen = c->ilen[i]; 26389566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a)); 2639cdc6f3adSToby Isaac } 2640fb3c7e2dSJunchao Zhang PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a)); 264102834360SBarry Smith } 26428c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26439566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C, A->boundtocpu)); 2644305c6ccfSStefano Zampini #endif 26459566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY)); 26469566063dSJacob Faibussowitsch 
PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY)); 264717ab2063SBarry Smith 26489566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow, &irow)); 2649416022c9SBarry Smith *B = C; 26503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 265117ab2063SBarry Smith } 265217ab2063SBarry Smith 2653ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat) 2654d71ae5a4SJacob Faibussowitsch { 265582d44351SHong Zhang Mat B; 265682d44351SHong Zhang 265782d44351SHong Zhang PetscFunctionBegin; 2658c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 26599566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm, &B)); 26609566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n)); 26619566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, mat, mat)); 26629566063dSJacob Faibussowitsch PetscCall(MatSetType(B, MATSEQAIJ)); 26639566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE)); 266482d44351SHong Zhang *subMat = B; 2665c2d650bdSHong Zhang } else { 26669566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN)); 2667c2d650bdSHong Zhang } 26683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 266982d44351SHong Zhang } 267082d44351SHong Zhang 2671ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info) 2672d71ae5a4SJacob Faibussowitsch { 267363b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 267463b91edcSBarry Smith Mat outA; 2675ace3abfcSBarry Smith PetscBool row_identity, col_identity; 267663b91edcSBarry Smith 26773a40ed3dSBarry Smith PetscFunctionBegin; 267808401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu"); 26791df811f5SHong Zhang 26809566063dSJacob Faibussowitsch 
PetscCall(ISIdentity(row, &row_identity)); 26819566063dSJacob Faibussowitsch PetscCall(ISIdentity(col, &col_identity)); 2682a871dcd8SBarry Smith 268363b91edcSBarry Smith outA = inA; 2684d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 26859566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 26869566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 26872205254eSKarl Rupp 26889566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 26899566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 26902205254eSKarl Rupp 2691c3122656SLisandro Dalcin a->row = row; 26922205254eSKarl Rupp 26939566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 26949566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 26952205254eSKarl Rupp 2696c3122656SLisandro Dalcin a->col = col; 269763b91edcSBarry Smith 269836db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26999566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 27009566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol)); 2701f0ec6fceSSatish Balay 270294a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 27039566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work)); 270494a9d846SBarry Smith } 270563b91edcSBarry Smith 27069566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2707137fb511SHong Zhang if (row_identity && col_identity) { 27089566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info)); 2709137fb511SHong Zhang } else { 27109566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info)); 2711137fb511SHong Zhang } 27123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2713a871dcd8SBarry Smith } 2714a871dcd8SBarry Smith 2715d71ae5a4SJacob Faibussowitsch 
PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha) 2716d71ae5a4SJacob Faibussowitsch { 2717f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data; 2718dfa0f9e5SStefano Zampini PetscScalar *v; 2719c5df96a5SBarry Smith PetscBLASInt one = 1, bnz; 27203a40ed3dSBarry Smith 27213a40ed3dSBarry Smith PetscFunctionBegin; 27229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA, &v)); 27239566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz, &bnz)); 2724792fecdfSBarry Smith PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one)); 27259566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA, &v)); 27279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2729f0b747eeSBarry Smith } 2730f0b747eeSBarry Smith 2731d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 2732d71ae5a4SJacob Faibussowitsch { 273316b64355SHong Zhang PetscInt i; 273416b64355SHong Zhang 273516b64355SHong Zhang PetscFunctionBegin; 273616b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27379566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr)); 273816b64355SHong Zhang 273948a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i])); 27409566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1)); 274116b64355SHong Zhang 274216b64355SHong Zhang if (submatj->rbuf1) { 27439566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27449566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 274516b64355SHong Zhang } 274616b64355SHong Zhang 274748a46eb9SPierre Jolivet for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i])); 27489566063dSJacob 
Faibussowitsch PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3)); 27499566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 275016b64355SHong Zhang } 275116b64355SHong Zhang 275216b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2753eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&submatj->rmap)); 27549566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 27559566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 275616b64355SHong Zhang #else 27579566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 275816b64355SHong Zhang #endif 275916b64355SHong Zhang 276016b64355SHong Zhang if (!submatj->allcolumns) { 276116b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 2762eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap)); 276316b64355SHong Zhang #else 27649566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 276516b64355SHong Zhang #endif 276616b64355SHong Zhang } 27679566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 276816b64355SHong Zhang 27699566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 27703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 277116b64355SHong Zhang } 277216b64355SHong Zhang 2773d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 2774d71ae5a4SJacob Faibussowitsch { 277516b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data; 27765c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 277716b64355SHong Zhang 277816b64355SHong Zhang PetscFunctionBegin; 27799566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 27809566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 27813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 278216b64355SHong Zhang } 278316b64355SHong Zhang 278489a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */ 
2785ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[]) 2786d71ae5a4SJacob Faibussowitsch { 27872d033e1fSHong Zhang PetscInt i; 27880fb991dcSHong Zhang Mat C; 27890fb991dcSHong Zhang Mat_SeqAIJ *c; 27900fb991dcSHong Zhang Mat_SubSppt *submatj; 27912d033e1fSHong Zhang 27922d033e1fSHong Zhang PetscFunctionBegin; 27932d033e1fSHong Zhang for (i = 0; i < n; i++) { 27940fb991dcSHong Zhang C = (*mat)[i]; 27950fb991dcSHong Zhang c = (Mat_SeqAIJ *)C->data; 27960fb991dcSHong Zhang submatj = c->submatis1; 27972d033e1fSHong Zhang if (submatj) { 2798682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 279926cc229bSBarry Smith PetscCall(PetscFree(C->factorprefix)); 28009566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 28019566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 28029566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 28033faff063SStefano Zampini PetscCall(PetscFree(C->defaultrandtype)); 28049566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 28059566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 28069566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2807682e4c99SStefano Zampini } 28082d033e1fSHong Zhang } else { 28099566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 28102d033e1fSHong Zhang } 28112d033e1fSHong Zhang } 281286e85357SHong Zhang 281363a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 28149566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n, mat)); 281563a75b2aSHong Zhang 28169566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28182d033e1fSHong Zhang } 28192d033e1fSHong Zhang 2820ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[]) 2821d71ae5a4SJacob Faibussowitsch 
{ 282297f1f81fSBarry Smith PetscInt i; 2823cddf8d76SBarry Smith 28243a40ed3dSBarry Smith PetscFunctionBegin; 282548a46eb9SPierre Jolivet if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B)); 2826cddf8d76SBarry Smith 282748a46eb9SPierre Jolivet for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i])); 28283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2829cddf8d76SBarry Smith } 2830cddf8d76SBarry Smith 2831ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov) 2832d71ae5a4SJacob Faibussowitsch { 2833e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 28349a88ca10SBarry Smith PetscInt row, i, j, k, l, ll, m, n, *nidx, isz, val; 28355d0c19d7SBarry Smith const PetscInt *idx; 28369a88ca10SBarry Smith PetscInt start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1; 2837f1af5d2fSBarry Smith PetscBT table; 2838bbd702dbSSatish Balay 28393a40ed3dSBarry Smith PetscFunctionBegin; 28409a88ca10SBarry Smith m = A->rmap->n / bs; 2841e4d965acSSatish Balay ai = a->i; 2842bfeeae90SHong Zhang aj = a->j; 28438a047759SSatish Balay 284408401ef6SPierre Jolivet PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used"); 284506763907SSatish Balay 28469566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nidx)); 28479566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m, &table)); 284806763907SSatish Balay 2849e4d965acSSatish Balay for (i = 0; i < is_max; i++) { 2850b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2851e4d965acSSatish Balay isz = 0; 28529566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m, table)); 2853e4d965acSSatish Balay 2854e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28559566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i], &idx)); 28569566063dSJacob 
Faibussowitsch PetscCall(ISGetLocalSize(is[i], &n)); 2857e4d965acSSatish Balay 28589a88ca10SBarry Smith if (bs > 1) { 28599a88ca10SBarry Smith /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 28609a88ca10SBarry Smith for (j = 0; j < n; ++j) { 28619a88ca10SBarry Smith if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs; 28629a88ca10SBarry Smith } 28639a88ca10SBarry Smith PetscCall(ISRestoreIndices(is[i], &idx)); 28649a88ca10SBarry Smith PetscCall(ISDestroy(&is[i])); 28659a88ca10SBarry Smith 28669a88ca10SBarry Smith k = 0; 28679a88ca10SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 28689a88ca10SBarry Smith n = isz; 28699a88ca10SBarry Smith for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 28709a88ca10SBarry Smith for (ll = 0; ll < bs; ll++) { 28719a88ca10SBarry Smith row = bs * nidx[k] + ll; 28729a88ca10SBarry Smith start = ai[row]; 28739a88ca10SBarry Smith end = ai[row + 1]; 28749a88ca10SBarry Smith for (l = start; l < end; l++) { 28759a88ca10SBarry Smith val = aj[l] / bs; 28769a88ca10SBarry Smith if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 28779a88ca10SBarry Smith } 28789a88ca10SBarry Smith } 28799a88ca10SBarry Smith } 28809a88ca10SBarry Smith } 28819a88ca10SBarry Smith PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i))); 28829a88ca10SBarry Smith } else { 2883dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2884e4d965acSSatish Balay for (j = 0; j < n; ++j) { 28852205254eSKarl Rupp if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j]; 28864dcbc457SBarry Smith } 28879566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i], &idx)); 28889566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2889e4d965acSSatish Balay 289004a348a9SBarry Smith k = 0; 289104a348a9SBarry Smith for (j = 0; j < ov; j++) { /* for each overlap */ 289204a348a9SBarry Smith n = isz; 289306763907SSatish Balay for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2894e4d965acSSatish Balay row = nidx[k]; 2895e4d965acSSatish Balay start = ai[row]; 2896e4d965acSSatish Balay end = ai[row + 1]; 289704a348a9SBarry Smith for (l = start; l < end; l++) { 2898efb16452SHong Zhang val = aj[l]; 28992205254eSKarl Rupp if (!PetscBTLookupSet(table, val)) nidx[isz++] = val; 2900e4d965acSSatish Balay } 2901e4d965acSSatish Balay } 2902e4d965acSSatish Balay } 29039566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i))); 2904e4d965acSSatish Balay } 29059a88ca10SBarry Smith } 29069566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 29079566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 29083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29094dcbc457SBarry Smith } 291017ab2063SBarry Smith 2911ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B) 2912d71ae5a4SJacob Faibussowitsch { 29130513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29143b98c0a2SBarry Smith PetscInt i, nz = 0, m = A->rmap->n, n = A->cmap->n; 29155d0c19d7SBarry Smith const PetscInt *row, *col; 29165d0c19d7SBarry Smith PetscInt *cnew, j, *lens; 291756cd22aeSBarry Smith IS icolp, irowp; 29180298fd71SBarry Smith PetscInt *cwork = NULL; 29190298fd71SBarry Smith PetscScalar *vwork = NULL; 29200513a670SBarry Smith 
29213a40ed3dSBarry Smith PetscFunctionBegin; 29229566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp)); 29239566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp, &row)); 29249566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp)); 29259566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp, &col)); 29260513a670SBarry Smith 29270513a670SBarry Smith /* determine lengths of permuted rows */ 29289566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &lens)); 29292205254eSKarl Rupp for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i]; 29309566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 29319566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, m, n, m, n)); 29329566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 29339566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 29349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens)); 29359566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29360513a670SBarry Smith 29379566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n, &cnew)); 29380513a670SBarry Smith for (i = 0; i < m; i++) { 29399566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29402205254eSKarl Rupp for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]]; 29419566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES)); 29429566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork)); 29430513a670SBarry Smith } 29449566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29452205254eSKarl Rupp 29463c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29472205254eSKarl Rupp 29488c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29499566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B, A->boundtocpu)); 29509fe5e383SStefano Zampini #endif 
29519566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY)); 29529566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY)); 29539566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp, &row)); 29549566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp, &col)); 29559566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29569566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 295748a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B)); 29583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29590513a670SBarry Smith } 29600513a670SBarry Smith 2961d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str) 2962d71ae5a4SJacob Faibussowitsch { 2963cb5b572fSBarry Smith PetscFunctionBegin; 296433f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. */ 296533f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2966be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 2967be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 29682e5835c6SStefano Zampini const PetscScalar *aa; 2969be6bf707SBarry Smith 29709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 297108401ef6SPierre Jolivet PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]); 29729566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n])); 29739566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 29749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 2975cb5b572fSBarry Smith } else { 29769566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 2977cb5b572fSBarry Smith } 29783ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 2979cb5b572fSBarry Smith } 2980cb5b572fSBarry Smith 2981d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[]) 2982d71ae5a4SJacob Faibussowitsch { 29836c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 29846e111a19SKarl Rupp 29856c0721eeSBarry Smith PetscFunctionBegin; 29866c0721eeSBarry Smith *array = a->a; 29873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29886c0721eeSBarry Smith } 29896c0721eeSBarry Smith 2990d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[]) 2991d71ae5a4SJacob Faibussowitsch { 29926c0721eeSBarry Smith PetscFunctionBegin; 2993f38c1e66SStefano Zampini *array = NULL; 29943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29956c0721eeSBarry Smith } 2996273d9f13SBarry Smith 29978229c054SShri Abhyankar /* 29988229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29998229c054SShri Abhyankar have different nonzero structure. 
30008229c054SShri Abhyankar */ 3001d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz) 3002d71ae5a4SJacob Faibussowitsch { 3003b264fe52SHong Zhang PetscInt i, j, k, nzx, nzy; 3004ec7775f6SShri Abhyankar 3005ec7775f6SShri Abhyankar PetscFunctionBegin; 3006ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 3007ec7775f6SShri Abhyankar for (i = 0; i < m; i++) { 3008*8e3a54c0SPierre Jolivet const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]); 3009b264fe52SHong Zhang nzx = xi[i + 1] - xi[i]; 3010b264fe52SHong Zhang nzy = yi[i + 1] - yi[i]; 30118af7cee1SJed Brown nnz[i] = 0; 30128af7cee1SJed Brown for (j = 0, k = 0; j < nzx; j++) { /* Point in X */ 3013b264fe52SHong Zhang for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3014b264fe52SHong Zhang if (k < nzy && yjj[k] == xjj[j]) k++; /* Skip duplicate */ 30158af7cee1SJed Brown nnz[i]++; 30168af7cee1SJed Brown } 30178af7cee1SJed Brown for (; k < nzy; k++) nnz[i]++; 3018ec7775f6SShri Abhyankar } 30193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3020ec7775f6SShri Abhyankar } 3021ec7775f6SShri Abhyankar 3022d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz) 3023d71ae5a4SJacob Faibussowitsch { 3024b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3025b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data; 3026b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data; 3027b264fe52SHong Zhang 3028b264fe52SHong Zhang PetscFunctionBegin; 3029b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 30309566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz)); 30313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3032b264fe52SHong Zhang } 
3033b264fe52SHong Zhang 3034d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 3035d71ae5a4SJacob Faibussowitsch { 3036ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data; 3037ac90fabeSBarry Smith 3038ac90fabeSBarry Smith PetscFunctionBegin; 3039134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3040134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3041134adf20SPierre Jolivet if (e) { 30429566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e)); 304381fa06acSBarry Smith if (e) { 30449566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e)); 3045134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 304681fa06acSBarry Smith } 304781fa06acSBarry Smith } 304854c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 304981fa06acSBarry Smith } 3050ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30512e5835c6SStefano Zampini const PetscScalar *xa; 30522e5835c6SStefano Zampini PetscScalar *ya, alpha = a; 305381fa06acSBarry Smith PetscBLASInt one = 1, bnz; 305481fa06acSBarry Smith 30559566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz, &bnz)); 30569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y, &ya)); 30579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X, &xa)); 3058792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one)); 30599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X, &xa)); 30609566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y, &ya)); 30619566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0 * bnz)); 30629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 30639566063dSJacob 
Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3064ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 30659566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 3066ac90fabeSBarry Smith } else { 30678229c054SShri Abhyankar Mat B; 30688229c054SShri Abhyankar PetscInt *nnz; 30699566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 30709566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 30719566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 30729566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap)); 30739566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 30749566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz)); 30759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 30769566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 30779566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 30789bb234a9SBarry Smith PetscCall(MatSeqAIJCheckInode(Y)); 30799566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3080ac90fabeSBarry Smith } 30813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3082ac90fabeSBarry Smith } 3083ac90fabeSBarry Smith 3084d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3085d71ae5a4SJacob Faibussowitsch { 3086354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3087354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3088354c94deSBarry Smith PetscInt i, nz; 3089354c94deSBarry Smith PetscScalar *a; 3090354c94deSBarry Smith 3091354c94deSBarry Smith PetscFunctionBegin; 3092354c94deSBarry Smith nz = aij->nz; 30939566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat, &a)); 30942205254eSKarl Rupp for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]); 
30959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat, &a)); 3096354c94deSBarry Smith #else 3097354c94deSBarry Smith PetscFunctionBegin; 3098354c94deSBarry Smith #endif 30993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3100354c94deSBarry Smith } 3101354c94deSBarry Smith 3102ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3103d71ae5a4SJacob Faibussowitsch { 3104e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3105d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3106e34fafa9SBarry Smith PetscReal atmp; 3107985db425SBarry Smith PetscScalar *x; 3108ce496241SStefano Zampini const MatScalar *aa, *av; 3109e34fafa9SBarry Smith 3110e34fafa9SBarry Smith PetscFunctionBegin; 311128b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31129566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3113ce496241SStefano Zampini aa = av; 3114e34fafa9SBarry Smith ai = a->i; 3115e34fafa9SBarry Smith aj = a->j; 3116e34fafa9SBarry Smith 31179566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31189566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31199566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 312008401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3121e34fafa9SBarry Smith for (i = 0; i < m; i++) { 31229371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31239371c9d4SSatish Balay ai++; 3124e34fafa9SBarry Smith for (j = 0; j < ncols; j++) { 3125985db425SBarry Smith atmp = PetscAbsScalar(*aa); 31269371c9d4SSatish Balay if (PetscAbsScalar(x[i]) < atmp) { 31279371c9d4SSatish Balay x[i] = atmp; 31289371c9d4SSatish Balay if (idx) idx[i] = *aj; 31299371c9d4SSatish Balay } 31309371c9d4SSatish Balay aa++; 31319371c9d4SSatish Balay aj++; 3132985db425SBarry Smith } 3133985db425SBarry 
Smith } 31349566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3137985db425SBarry Smith } 3138985db425SBarry Smith 3139ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3140d71ae5a4SJacob Faibussowitsch { 3141985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3142d0f46423SBarry Smith PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3143985db425SBarry Smith PetscScalar *x; 3144ce496241SStefano Zampini const MatScalar *aa, *av; 3145985db425SBarry Smith 3146985db425SBarry Smith PetscFunctionBegin; 314728b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 31489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3149ce496241SStefano Zampini aa = av; 3150985db425SBarry Smith ai = a->i; 3151985db425SBarry Smith aj = a->j; 3152985db425SBarry Smith 31539566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 31549566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 31559566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 315608401ef6SPierre Jolivet PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3157985db425SBarry Smith for (i = 0; i < m; i++) { 31589371c9d4SSatish Balay ncols = ai[1] - ai[0]; 31599371c9d4SSatish Balay ai++; 3160d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 31619371c9d4SSatish Balay x[i] = *aa; 31629371c9d4SSatish Balay if (idx) idx[i] = 0; 3163985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3164985db425SBarry Smith x[i] = 0.0; 3165985db425SBarry Smith if (idx) { 3166985db425SBarry Smith for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */ 3167985db425SBarry Smith if (aj[j] > j) { 
3168985db425SBarry Smith idx[i] = j; 3169985db425SBarry Smith break; 3170985db425SBarry Smith } 3171985db425SBarry Smith } 31721a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 31731a254869SHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3174985db425SBarry Smith } 3175985db425SBarry Smith } 3176985db425SBarry Smith for (j = 0; j < ncols; j++) { 31779371c9d4SSatish Balay if (PetscRealPart(x[i]) < PetscRealPart(*aa)) { 31789371c9d4SSatish Balay x[i] = *aa; 31799371c9d4SSatish Balay if (idx) idx[i] = *aj; 31809371c9d4SSatish Balay } 31819371c9d4SSatish Balay aa++; 31829371c9d4SSatish Balay aj++; 3183985db425SBarry Smith } 3184985db425SBarry Smith } 31859566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 31869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 31873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3188985db425SBarry Smith } 3189985db425SBarry Smith 3190ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3191d71ae5a4SJacob Faibussowitsch { 3192c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3193c87e5d42SMatthew Knepley PetscInt i, j, m = A->rmap->n, *ai, *aj, ncols, n; 3194ce496241SStefano Zampini PetscScalar *x; 3195ce496241SStefano Zampini const MatScalar *aa, *av; 3196c87e5d42SMatthew Knepley 3197c87e5d42SMatthew Knepley PetscFunctionBegin; 31989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3199ce496241SStefano Zampini aa = av; 3200c87e5d42SMatthew Knepley ai = a->i; 3201c87e5d42SMatthew Knepley aj = a->j; 3202c87e5d42SMatthew Knepley 32039566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32049566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32059566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 320608401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" 
PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n); 3207c87e5d42SMatthew Knepley for (i = 0; i < m; i++) { 32089371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32099371c9d4SSatish Balay ai++; 3210f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 32119371c9d4SSatish Balay x[i] = *aa; 32129371c9d4SSatish Balay if (idx) idx[i] = 0; 3213f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3214f07e67edSHong Zhang x[i] = 0.0; 3215f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3216289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3217f07e67edSHong Zhang if (aj[j] > j) { 3218f07e67edSHong Zhang idx[i] = j; 32192205254eSKarl Rupp break; 32202205254eSKarl Rupp } 3221289a08f5SMatthew Knepley } 3222f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3223f07e67edSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3224f07e67edSHong Zhang } 3225289a08f5SMatthew Knepley } 3226c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 32279371c9d4SSatish Balay if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) { 32289371c9d4SSatish Balay x[i] = *aa; 32299371c9d4SSatish Balay if (idx) idx[i] = *aj; 32309371c9d4SSatish Balay } 32319371c9d4SSatish Balay aa++; 32329371c9d4SSatish Balay aj++; 3233c87e5d42SMatthew Knepley } 3234c87e5d42SMatthew Knepley } 32359566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v, &x)); 32369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &av)); 32373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3238c87e5d42SMatthew Knepley } 3239c87e5d42SMatthew Knepley 3240ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[]) 3241d71ae5a4SJacob Faibussowitsch { 3242985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 3243d9ca1df4SBarry Smith PetscInt i, j, m = A->rmap->n, ncols, n; 3244d9ca1df4SBarry Smith const PetscInt *ai, *aj; 3245985db425SBarry Smith 
PetscScalar *x; 3246ce496241SStefano Zampini const MatScalar *aa, *av; 3247985db425SBarry Smith 3248985db425SBarry Smith PetscFunctionBegin; 324928b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 32509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &av)); 3251ce496241SStefano Zampini aa = av; 3252985db425SBarry Smith ai = a->i; 3253985db425SBarry Smith aj = a->j; 3254985db425SBarry Smith 32559566063dSJacob Faibussowitsch PetscCall(VecSet(v, 0.0)); 32569566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v, &x)); 32579566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v, &n)); 325808401ef6SPierre Jolivet PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector"); 3259985db425SBarry Smith for (i = 0; i < m; i++) { 32609371c9d4SSatish Balay ncols = ai[1] - ai[0]; 32619371c9d4SSatish Balay ai++; 3262d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 32639371c9d4SSatish Balay x[i] = *aa; 32649371c9d4SSatish Balay if (idx) idx[i] = 0; 3265985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3266985db425SBarry Smith x[i] = 0.0; 3267985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3268985db425SBarry Smith for (j = 0; j < ncols; j++) { 3269985db425SBarry Smith if (aj[j] > j) { 3270985db425SBarry Smith idx[i] = j; 3271985db425SBarry Smith break; 3272985db425SBarry Smith } 3273985db425SBarry Smith } 3274fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3275fa213d2fSHong Zhang if (j == ncols && j < A->cmap->n) idx[i] = j; 3276985db425SBarry Smith } 3277985db425SBarry Smith } 3278985db425SBarry Smith for (j = 0; j < ncols; j++) { 32799371c9d4SSatish Balay if (PetscRealPart(x[i]) > PetscRealPart(*aa)) { 32809371c9d4SSatish Balay x[i] = *aa; 32819371c9d4SSatish Balay if (idx) idx[i] = *aj; 32829371c9d4SSatish Balay } 
      aa++;
      aj++;
    }
  }
  PetscCall(VecRestoreArrayWrite(v, &x));
  PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
  MatInvertBlockDiagonal_SeqAIJ - Inverts every bs x bs diagonal block of A, with bs = |A->rmap->bs|,
  and caches the mbs = A->rmap->n / bs inverted blocks back to back in a->ibdiag (bs * bs entries each).

  Input Parameter:
. A - the matrix

  Output Parameter:
. values - if non-NULL, set to point at the cached array a->ibdiag

  Notes:
  If a->ibdiagvalid is already set, the cached array is handed back without any recomputation.

  Zero pivots are tolerated exactly when A->erroriffailure is false. For bs == 1 a diagonal entry whose
  magnitude is below PETSC_MACHINE_EPSILON is either recorded in A->factorerrortype and the
  A->factorerror_zeropivot_* fields (and reported through PetscInfo()) or raised as PETSC_ERR_MAT_LU_ZRPVT.
  For larger blocks the detection is delegated to the PetscKernel_A_gets_inverse_A* kernels and only
  A->factorerrortype is recorded.

  NOTE(review): rows beyond mbs * bs (when A->rmap->n is not a multiple of bs) are not visited - confirm
  that callers guarantee divisibility.
*/
static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values)
{
  Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
  PetscInt        i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j;
  MatScalar      *diag, work[25], *v_work;
  const PetscReal shift = 0.0;
  PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;

  PetscFunctionBegin;
  allowzeropivot = PetscNot(A->erroriffailure);
  /* fast path: the inverse blocks were computed earlier and are still flagged valid */
  if (a->ibdiagvalid) {
    if (values) *values = a->ibdiag;
    PetscFunctionReturn(PETSC_SUCCESS);
  }
  PetscCall(MatMarkDiagonal_SeqAIJ(A));
  /* the cache is allocated once and reused by later recomputations */
  if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); }
  diag = a->ibdiag;
  if (values) *values = a->ibdiag;
  /* factor and invert each block */
  /* sizes 1..7 use fixed-size kernels with the stack scratch ij[] (and ipvt[]/work[] for size 5); other sizes use heap scratch */
  switch (bs) {
  case 1:
    for (i = 0; i < mbs; i++) {
      PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i));
      if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) {
        if (allowzeropivot) {
          A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
          A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]);
          A->factorerror_zeropivot_row   = i;
          PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON));
        } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON);
      }
      /* the reciprocal is still taken when a tolerated zero pivot was recorded above */
      diag[i] = (PetscScalar)1.0 / (diag[i] + shift);
    }
    break;
  case 2:
    for (i = 0; i < mbs; i++) {
      ij[0] = 2 * i;
      ij[1] = 2 * i + 1;
      PetscCall(MatGetValues(A, 2, ij, 2, ij, diag));
      PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
      if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
      /* NOTE(review): the in-place transpose presumably converts between the layout filled by MatGetValues() and the one consumers of ibdiag expect - confirm */
      PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
      diag += 4;
    }
    break;
  case 3:
    for (i = 0; i < mbs; i++) {
      ij[0] = 3 * i;
      ij[1] = 3 * i + 1;
      ij[2] = 3 * i + 2;
      PetscCall(MatGetValues(A, 3, ij, 3, ij, diag));
      PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
      if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
      PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
      diag += 9;
    }
    break;
  case 4:
    for (i = 0; i < mbs; i++) {
      ij[0] = 4 * i;
      ij[1] = 4 * i + 1;
      ij[2] = 4 * i + 2;
      ij[3] = 4 * i + 3;
      PetscCall(MatGetValues(A, 4, ij, 4, ij, diag));
      PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
      if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
      PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
      diag += 16;
    }
    break;
  case 5:
    for (i = 0; i < mbs; i++) {
      ij[0] = 5 * i;
      ij[1] = 5 * i + 1;
      ij[2] = 5 * i + 2;
      ij[3] = 5 * i + 3;
      ij[4] = 5 * i + 4;
      PetscCall(MatGetValues(A, 5, ij, 5, ij, diag));
      /* the only fixed-size kernel that takes explicit pivot and work scratch */
      PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
      if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
      PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
      diag += 25;
    }
    break;
  case 6:
    for (i = 0; i < mbs; i++) {
      ij[0] = 6 * i;
      ij[1] = 6 * i + 1;
      ij[2] = 6 * i + 2;
      ij[3] = 6 * i + 3;
      ij[4] = 6 * i + 4;
      ij[5] = 6 * i + 5;
      PetscCall(MatGetValues(A, 6, ij, 6, ij, diag));
      PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
      if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
      PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
      diag += 36;
    }
    break;
  case 7:
    for (i = 0; i < mbs; i++) {
      ij[0] = 7 * i;
      ij[1] = 7 * i + 1;
      ij[2] = 7 * i + 2;
      ij[3] = 7 * i + 3;
      ij[4] = 7 * i + 4;
      ij[5] = 7 * i + 5;
      ij[6] = 7 * i + 6;
      PetscCall(MatGetValues(A, 7, ij, 7, ij, diag));
      PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
      if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
      PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
      diag += 49;
    }
    break;
  default:
    /* general block size: index, pivot and work scratch of length bs come from one combined allocation */
    PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ));
    for (i = 0; i < mbs; i++) {
      for (j = 0; j < bs; j++) IJ[j] = bs * i + j;
      PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag));
      /* unlike the fixed-size kernels, this call is not passed the shift */
      PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
      if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
      PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs));
      diag += bs2;
    }
    PetscCall(PetscFree3(v_work, v_pivots, IJ));
  }
  a->ibdiagvalid = PETSC_TRUE;
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
  MatSetRandom_SeqAIJ - Fills the matrix with values drawn from rctx and then performs a final assembly.

  Unassembled matrix: for every row i, aij->imax[i] values are drawn; each drawn value a is added
  (ADD_VALUES) at column (PetscInt)(n * PetscRealPart(a)), so the value also selects its own column.
  NOTE(review): that column lies in [0, n) only if the real part of the drawn value lies in [0, 1) -
  confirm the interval configured on rctx.

  Assembled matrix: the aij->nz stored values are overwritten in place through the write-access array.
*/
static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
  PetscScalar a, *aa;
  PetscInt    m, n, i, j, col;

  PetscFunctionBegin;
  if (!x->assembled) {
    PetscCall(MatGetSize(x, &m, &n));
    for (i = 0; i < m; i++) {
      for (j = 0; j < aij->imax[i]; j++) {
        PetscCall(PetscRandomGetValue(rctx, &a));
        col = (PetscInt)(n * PetscRealPart(a));
        PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
      }
    }
  } else {
    PetscCall(MatSeqAIJGetArrayWrite(x, &aa));
    for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i));
    PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa));
  }
  PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
  PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
  PetscFunctionReturn(PETSC_SUCCESS);
}

Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3450d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx) 3451d71ae5a4SJacob Faibussowitsch { 3452679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data; 3453679944adSJunchao Zhang PetscScalar a; 3454679944adSJunchao Zhang PetscInt m, n, i, j, col, nskip; 3455679944adSJunchao Zhang 3456679944adSJunchao Zhang PetscFunctionBegin; 3457679944adSJunchao Zhang nskip = high - low; 34589566063dSJacob Faibussowitsch PetscCall(MatGetSize(x, &m, &n)); 3459679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3460679944adSJunchao Zhang for (i = 0; i < m; i++) { 3461679944adSJunchao Zhang for (j = 0; j < aij->imax[i]; j++) { 34629566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx, &a)); 3463679944adSJunchao Zhang col = (PetscInt)(n * PetscRealPart(a)); 3464679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34659566063dSJacob Faibussowitsch PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES)); 3466679944adSJunchao Zhang } 3467e2ce353bSJunchao Zhang } 34689566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY)); 34699566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY)); 34703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3471679944adSJunchao Zhang } 3472679944adSJunchao Zhang 34730a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ, 3474cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3475cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3476cb5b572fSBarry Smith MatMult_SeqAIJ, 347797304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34787c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34797c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3480f4259b30SLisandro Dalcin NULL, 3481f4259b30SLisandro Dalcin NULL, 
3482f4259b30SLisandro Dalcin NULL, 3483f4259b30SLisandro Dalcin /* 10*/ NULL, 3484cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3485f4259b30SLisandro Dalcin NULL, 348641f059aeSBarry Smith MatSOR_SeqAIJ, 348791e9d3e2SHong Zhang MatTranspose_SeqAIJ, 348897304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3489cb5b572fSBarry Smith MatEqual_SeqAIJ, 3490cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3491cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3492cb5b572fSBarry Smith MatNorm_SeqAIJ, 3493f4259b30SLisandro Dalcin /* 20*/ NULL, 3494cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3495cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3496cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3497d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3498f4259b30SLisandro Dalcin NULL, 3499f4259b30SLisandro Dalcin NULL, 3500f4259b30SLisandro Dalcin NULL, 3501f4259b30SLisandro Dalcin NULL, 350226cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 3503f4259b30SLisandro Dalcin NULL, 3504f4259b30SLisandro Dalcin NULL, 3505f4259b30SLisandro Dalcin NULL, 3506f4259b30SLisandro Dalcin NULL, 3507d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3508f4259b30SLisandro Dalcin NULL, 3509f4259b30SLisandro Dalcin NULL, 3510cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3511f4259b30SLisandro Dalcin NULL, 3512d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35137dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3514cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3515cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3516cb5b572fSBarry Smith MatCopy_SeqAIJ, 3517d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3518cb5b572fSBarry Smith MatScale_SeqAIJ, 35197d68702bSBarry Smith MatShift_SeqAIJ, 352079299369SBarry Smith MatDiagonalSet_SeqAIJ, 35216e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 352273a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35233b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35243b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35253b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3526a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 
352793dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3528f4259b30SLisandro Dalcin NULL, 3529f4259b30SLisandro Dalcin NULL, 3530cda55fadSBarry Smith MatPermute_SeqAIJ, 3531f4259b30SLisandro Dalcin NULL, 3532f4259b30SLisandro Dalcin /* 59*/ NULL, 3533b9b97703SBarry Smith MatDestroy_SeqAIJ, 3534b9b97703SBarry Smith MatView_SeqAIJ, 3535f4259b30SLisandro Dalcin NULL, 3536f4259b30SLisandro Dalcin NULL, 3537f4259b30SLisandro Dalcin /* 64*/ NULL, 3538321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3539f4259b30SLisandro Dalcin NULL, 3540f4259b30SLisandro Dalcin NULL, 3541f4259b30SLisandro Dalcin NULL, 3542d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3543c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3544f4259b30SLisandro Dalcin NULL, 3545f4259b30SLisandro Dalcin NULL, 3546f4259b30SLisandro Dalcin NULL, 3547f4259b30SLisandro Dalcin /* 74*/ NULL, 35483acb8795SBarry Smith MatFDColoringApply_AIJ, 3549f4259b30SLisandro Dalcin NULL, 3550f4259b30SLisandro Dalcin NULL, 3551f4259b30SLisandro Dalcin NULL, 35526ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3553f4259b30SLisandro Dalcin NULL, 3554f4259b30SLisandro Dalcin NULL, 3555f4259b30SLisandro Dalcin NULL, 3556bc011b1eSHong Zhang MatLoad_SeqAIJ, 3557d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35581cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3559f4259b30SLisandro Dalcin NULL, 3560f4259b30SLisandro Dalcin NULL, 3561f4259b30SLisandro Dalcin NULL, 3562f4259b30SLisandro Dalcin /* 89*/ NULL, 3563f4259b30SLisandro Dalcin NULL, 356426be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3565f4259b30SLisandro Dalcin NULL, 3566f4259b30SLisandro Dalcin NULL, 35678fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3568f4259b30SLisandro Dalcin NULL, 3569f4259b30SLisandro Dalcin NULL, 35706fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3571f4259b30SLisandro Dalcin NULL, 35724222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3573f4259b30SLisandro 
Dalcin NULL, 3574f4259b30SLisandro Dalcin NULL, 357587d4246cSBarry Smith MatConjugate_SeqAIJ, 3576f4259b30SLisandro Dalcin NULL, 3577d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 357899cafbc1SBarry Smith MatRealPart_SeqAIJ, 3579f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3580f4259b30SLisandro Dalcin NULL, 3581f4259b30SLisandro Dalcin NULL, 3582cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3583f4259b30SLisandro Dalcin NULL, 35842af78befSBarry Smith MatGetRowMin_SeqAIJ, 3585f4259b30SLisandro Dalcin NULL, 3586599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3587f4259b30SLisandro Dalcin /*114*/ NULL, 3588f4259b30SLisandro Dalcin NULL, 3589f4259b30SLisandro Dalcin NULL, 3590f4259b30SLisandro Dalcin NULL, 3591f4259b30SLisandro Dalcin NULL, 3592f4259b30SLisandro Dalcin /*119*/ NULL, 3593f4259b30SLisandro Dalcin NULL, 3594f4259b30SLisandro Dalcin NULL, 3595f4259b30SLisandro Dalcin NULL, 3596b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 35970716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3598a873a8cdSSam Reynolds MatGetColumnReductions_SeqAIJ, 359937868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 36000da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3601f4259b30SLisandro Dalcin NULL, 3602f4259b30SLisandro Dalcin /*129*/ NULL, 3603f4259b30SLisandro Dalcin NULL, 3604f4259b30SLisandro Dalcin NULL, 360575648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3606b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3607b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36082b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3609f4259b30SLisandro Dalcin NULL, 3610f4259b30SLisandro Dalcin NULL, 36113964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3612f4259b30SLisandro Dalcin /*139*/ NULL, 3613f4259b30SLisandro Dalcin NULL, 3614f4259b30SLisandro Dalcin NULL, 36153a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36169c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36174222ddf1SHong Zhang 
MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36184222ddf1SHong Zhang /*145*/ MatDestroySubMatrices_SeqAIJ, 3619f4259b30SLisandro Dalcin NULL, 362072833a62Smarkadams4 NULL, 362172833a62Smarkadams4 MatCreateGraph_Simple_AIJ, 36222d776b49SBarry Smith NULL, 3623dec0b466SHong Zhang /*150*/ MatTransposeSymbolic_SeqAIJ, 3624dec0b466SHong Zhang MatEliminateZeros_SeqAIJ}; 362517ab2063SBarry Smith 3626ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices) 3627d71ae5a4SJacob Faibussowitsch { 3628bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 362997f1f81fSBarry Smith PetscInt i, nz, n; 3630bef8e0ddSBarry Smith 3631bef8e0ddSBarry Smith PetscFunctionBegin; 3632bef8e0ddSBarry Smith nz = aij->maxnz; 3633d0f46423SBarry Smith n = mat->rmap->n; 3634ad540459SPierre Jolivet for (i = 0; i < nz; i++) aij->j[i] = indices[i]; 3635bef8e0ddSBarry Smith aij->nz = nz; 3636ad540459SPierre Jolivet for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i]; 36373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3638bef8e0ddSBarry Smith } 3639bef8e0ddSBarry Smith 3640a3bb6f32SFande Kong /* 3641ddea5d60SJunchao Zhang * Given a sparse matrix with global column indices, compact it by using a local column space. 
3642ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3643ddea5d60SJunchao Zhang */ 3644d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3645d71ae5a4SJacob Faibussowitsch { 3646a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 3647eec179cfSJacob Faibussowitsch PetscHMapI gid1_lid1; 3648eec179cfSJacob Faibussowitsch PetscHashIter tpos; 364925b670f0SStefano Zampini PetscInt gid, lid, i, ec, nz = aij->nz; 365025b670f0SStefano Zampini PetscInt *garray, *jj = aij->j; 3651a3bb6f32SFande Kong 3652a3bb6f32SFande Kong PetscFunctionBegin; 3653a3bb6f32SFande Kong PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 36544f572ea9SToby Isaac PetscAssertPointer(mapping, 2); 3655a3bb6f32SFande Kong /* use a table */ 3656eec179cfSJacob Faibussowitsch PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1)); 3657a3bb6f32SFande Kong ec = 0; 365825b670f0SStefano Zampini for (i = 0; i < nz; i++) { 365925b670f0SStefano Zampini PetscInt data, gid1 = jj[i] + 1; 3660eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data)); 3661a3bb6f32SFande Kong if (!data) { 3662a3bb6f32SFande Kong /* one based table */ 3663c76ffc5fSJacob Faibussowitsch PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec)); 3664a3bb6f32SFande Kong } 3665a3bb6f32SFande Kong } 3666a3bb6f32SFande Kong /* form array of columns we need */ 36679566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec, &garray)); 3668eec179cfSJacob Faibussowitsch PetscHashIterBegin(gid1_lid1, tpos); 3669eec179cfSJacob Faibussowitsch while (!PetscHashIterAtEnd(gid1_lid1, tpos)) { 3670eec179cfSJacob Faibussowitsch PetscHashIterGetKey(gid1_lid1, tpos, gid); 3671eec179cfSJacob Faibussowitsch PetscHashIterGetVal(gid1_lid1, tpos, lid); 3672eec179cfSJacob Faibussowitsch PetscHashIterNext(gid1_lid1, tpos); 3673a3bb6f32SFande Kong gid--; 3674a3bb6f32SFande 
Kong lid--; 3675a3bb6f32SFande Kong garray[lid] = gid; 3676a3bb6f32SFande Kong } 36779566063dSJacob Faibussowitsch PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */ 3678eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIClear(gid1_lid1)); 3679c76ffc5fSJacob Faibussowitsch for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1)); 3680a3bb6f32SFande Kong /* compact out the extra columns in B */ 368125b670f0SStefano Zampini for (i = 0; i < nz; i++) { 368225b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 3683eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid)); 3684a3bb6f32SFande Kong lid--; 368525b670f0SStefano Zampini jj[i] = lid; 3686a3bb6f32SFande Kong } 36879566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 3688eec179cfSJacob Faibussowitsch PetscCall(PetscHMapIDestroy(&gid1_lid1)); 36899566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap)); 36909566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping)); 36919566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH)); 36923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3693a3bb6f32SFande Kong } 3694a3bb6f32SFande Kong 3695bef8e0ddSBarry Smith /*@ 3696bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3697bef8e0ddSBarry Smith in the matrix. 

  Input Parameters:
+ mat     - the `MATSEQAIJ` matrix
- indices - the column indices

  Level: advanced

  Notes:
  This can be called if you have precomputed the nonzero structure of the
  matrix and want to provide it to the matrix object to improve the performance
  of the `MatSetValues()` operation.

  You MUST have set the correct numbers of nonzeros per row in the call to
  `MatCreateSeqAIJ()`, and the column indices MUST be sorted.

  MUST be called before any calls to `MatSetValues()`

  The indices should start with zero, not one.

.seealso: [](ch_matrices), `Mat`, `MATSEQAIJ`
@*/
PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices)
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
  PetscAssertPointer(indices, 2);
  /* forwards to whatever implementation is registered on mat under the name "MatSeqAIJSetColumnIndices_C" */
  PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
  MatStoreValues_SeqAIJ - Copies the first aij->i[mat->rmap->n] entries of the value array aij->a
  into aij->saved_values, allocating saved_values on the first call only.

  Fails with PETSC_ERR_ORDER unless aij->nonew is set.
*/
static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
  size_t      nz  = aij->i[mat->rmap->n];

  PetscFunctionBegin;
  PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");

  /* allocate space for values if not already there */
  /* one slot more than is copied below is requested */
  if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); }

  /* copy values over */
  PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*@
  MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the
  nonlinear portion.

  Logically Collective

  Input Parameter:
. mat - the matrix (currently only `MATAIJ` matrices support this option)

  Level: advanced

  Example Usage:
.vb
    Using SNES
    Create Jacobian matrix
    Set linear terms into matrix
    Apply boundary conditions to matrix, at this time matrix must have
    final nonzero structure (i.e.
    setting the nonlinear terms and applying
    boundary conditions again will not change the nonzero structure)
    MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
    MatStoreValues(mat);
    Call SNESSetJacobian() with matrix
    In your Jacobian routine
    MatRetrieveValues(mat);
    Set nonlinear terms in matrix

    Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself:
    // build linear portion of Jacobian
    MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
    MatStoreValues(mat);
    loop over nonlinear iterations
    MatRetrieveValues(mat);
    // call MatSetValues(mat,...) to set nonlinear portion of Jacobian
    // call MatAssemblyBegin/End() on matrix
    Solve linear system with Jacobian
    endloop
.ve

  Notes:
  Matrix must already be assembled before calling this routine
  Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
  calling this routine.

  When this is called multiple times it overwrites the previous set of stored values
  and does not allocate additional space.

.seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()`
@*/
PetscErrorCode MatStoreValues(Mat mat)
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
  /* only an assembled, unfactored matrix is accepted */
  PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
  PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
  /* forwards to whatever implementation is registered on mat under the name "MatStoreValues_C" */
  PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*
  MatRetrieveValues_SeqAIJ - Copies the first aij->i[mat->rmap->n] entries of aij->saved_values
  back into the value array aij->a.

  Fails with PETSC_ERR_ORDER unless aij->nonew is set and aij->saved_values has been allocated.
*/
static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
  PetscInt    nz  = aij->i[mat->rmap->n];

  PetscFunctionBegin;
  PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
  PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
  /* copy values over */
  PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*@
  MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()`

  Logically Collective

  Input Parameter:
. mat - the matrix (currently only `MATAIJ` matrices support this option)

  Level: advanced

.seealso: [](ch_matrices), `Mat`, `MatStoreValues()`
@*/
PetscErrorCode MatRetrieveValues(Mat mat)
{
  PetscFunctionBegin;
  PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
  /* only an assembled, unfactored matrix is accepted */
  PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
  PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
  /* forwards to whatever implementation is registered on mat under the name "MatRetrieveValues_C" */
  PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*@C
  MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
  (the default parallel PETSc format).  For good matrix assembly performance
  the user should preallocate the matrix storage by setting the parameter `nz`
  (or the array `nnz`).

  Collective

  Input Parameters:
+ comm - MPI communicator, set to `PETSC_COMM_SELF`
. m    - number of rows
. n    - number of columns
.
nz   - number of nonzeros per row (same for all rows)
- nnz  - array containing the number of nonzeros in the various rows
         (possibly different for each row) or NULL

  Output Parameter:
. A - the matrix

  Options Database Keys:
+ -mat_no_inode            - Do not use inodes
- -mat_inode_limit <limit> - Sets inode limit (max limit=5)

  Level: intermediate

  Notes:
  It is recommended to use `MatCreateFromOptions()` instead of this routine

  If `nnz` is given then `nz` is ignored

  The `MATSEQAIJ` format, also called
  compressed row storage, is fully compatible with standard Fortran
  storage.  That is, the stored row and column indices can begin at
  either one (as in Fortran) or zero.

  Specify the preallocated storage with either `nz` or `nnz` (not both).
  Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
  allocation.

  By default, this format uses inodes (identical nodes) when possible, to
  improve numerical efficiency of matrix-vector products and solves. We
  search for consecutive rows with the same nonzero structure, thereby
  reusing matrix information to achieve increased efficiency.

.seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
@*/
PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
{
  PetscFunctionBegin;
  PetscCall(MatCreate(comm, A));
  /* m and n are passed as both the local and the global sizes */
  PetscCall(MatSetSizes(*A, m, n, m, n));
  PetscCall(MatSetType(*A, MATSEQAIJ));
  /* the SeqAIJ preallocation routine is called directly, not through MatSeqAIJSetPreallocation() */
  PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
  PetscFunctionReturn(PETSC_SUCCESS);
}

/*@C
  MatSeqAIJSetPreallocation - For good matrix assembly performance
  the user should preallocate the matrix storage by setting the parameter `nz`
  (or the array `nnz`).  By setting these parameters accurately, performance
  during matrix assembly can be increased by more than a factor of 50.

  Collective

  Input Parameters:
+ B   - The matrix
.
nz  - number of nonzeros per row (same for all rows)
- nnz - array containing the number of nonzeros in the various rows
        (possibly different for each row) or NULL

  Options Database Keys:
+ -mat_no_inode            - Do not use inodes
- -mat_inode_limit <limit> - Sets inode limit (max limit=5)

  Level: intermediate

  Notes:
  If `nnz` is given then `nz` is ignored

  The `MATSEQAIJ` format, also called
  compressed row storage, is fully compatible with standard Fortran
  storage.  That is, the stored row and column indices can begin at
  either one (as in Fortran) or zero.  See the users' manual for details.

  Specify the preallocated storage with either `nz` or `nnz` (not both).
  Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
  allocation.

  You can call `MatGetInfo()` to get information on how effective the preallocation was;
  for example the fields mallocs, nz_allocated, nz_used, nz_unneeded.
  You can also run with the option -info and look for messages with the string
  malloc in them to see if additional memory allocation was needed.
3929aa95bbe8SBarry Smith 393011a5261eSBarry Smith Developer Notes: 393111a5261eSBarry Smith Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix 3932a96a251dSBarry Smith entries or columns indices 3933a96a251dSBarry Smith 3934273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3935273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3936273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3937273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3938273d9f13SBarry Smith 39391cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`, 3940db781477SPatrick Sanan `MatSeqAIJSetTotalPreallocation()` 3941273d9f13SBarry Smith @*/ 3942d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[]) 3943d71ae5a4SJacob Faibussowitsch { 3944a23d5eceSKris Buschelman PetscFunctionBegin; 39456ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 39466ba663aaSJed Brown PetscValidType(B, 1); 3947cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz)); 39483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 3949a23d5eceSKris Buschelman } 3950a23d5eceSKris Buschelman 3951d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz) 3952d71ae5a4SJacob Faibussowitsch { 3953ad79cf63SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 39542576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE; 395597f1f81fSBarry Smith PetscInt i; 3956273d9f13SBarry Smith 3957273d9f13SBarry Smith PetscFunctionBegin; 3958ad79cf63SBarry Smith if (B->hash_active) { 3959aea10558SJacob Faibussowitsch B->ops[0] = 
b->cops; 3960ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 3961ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 3962ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 3963ad79cf63SBarry Smith } 39642576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3965a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3966c461c341SBarry Smith skipallocation = PETSC_TRUE; 3967c461c341SBarry Smith nz = 0; 3968c461c341SBarry Smith } 39699566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39709566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3971899cda47SBarry Smith 3972435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 397308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 3974cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3975d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) { 397608401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 397708401ef6SPierre Jolivet PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n); 3978b73539f3SBarry Smith } 3979b73539f3SBarry Smith } 3980b73539f3SBarry Smith 3981273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 3982ab93d7beSBarry Smith if (!skipallocation) { 39834dfa11a4SJacob Faibussowitsch if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); } 3984071fcb05SBarry Smith if (!b->ilen) { 3985071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 39869566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n, &b->ilen)); 3987071fcb05SBarry Smith } else { 39889566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt))); 39892ee49352SLisandro Dalcin } 3990aa624791SPierre Jolivet if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); 3991273d9f13SBarry Smith if (!nnz) { 3992435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3993c62bd62aSJed Brown else if (nz < 0) nz = 1; 39945d2a9ed1SStefano Zampini nz = PetscMin(nz, B->cmap->n); 3995d0f46423SBarry Smith for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz; 3996c43c4a61SBarry Smith PetscCall(PetscIntMultError(nz, B->rmap->n, &nz)); 3997273d9f13SBarry Smith } else { 3998c73702f5SBarry Smith PetscInt64 nz64 = 0; 39999371c9d4SSatish Balay for (i = 0; i < B->rmap->n; i++) { 40009371c9d4SSatish Balay b->imax[i] = nnz[i]; 40019371c9d4SSatish Balay nz64 += nnz[i]; 40029371c9d4SSatish Balay } 40039566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 4004273d9f13SBarry Smith } 4005ab93d7beSBarry Smith 4006273d9f13SBarry Smith /* allocate the matrix space */ 400753dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 40089566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 4009396832f4SHong Zhang if (B->structure_only) { 40109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &b->j)); 40119566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i)); 4012396832f4SHong Zhang } else { 40139566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i)); 4014396832f4SHong Zhang } 4015bfeeae90SHong Zhang b->i[0] = 0; 4016ad540459SPierre Jolivet for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 4017396832f4SHong Zhang if (B->structure_only) { 4018396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4019396832f4SHong Zhang b->free_a = PETSC_FALSE; 4020396832f4SHong Zhang } else { 4021273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4022e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4023396832f4SHong Zhang } 4024e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4025c461c341SBarry Smith } else { 4026e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4027e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4028c461c341SBarry Smith } 4029273d9f13SBarry Smith 4030846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4031846b4da1SFande Kong /* reserve user-requested sparsity */ 40329566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n)); 4033846b4da1SFande Kong } 4034846b4da1SFande Kong 4035273d9f13SBarry Smith b->nz = 0; 4036273d9f13SBarry Smith b->maxnz = nz; 4037273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40381baa6e33SBarry Smith if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 4039cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4040cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 40415519a089SJose E. Roman /* We simply deem preallocation has changed nonzero state. Updating the state 40425519a089SJose E. Roman will give clients (like AIJKokkos) a chance to know something has happened. 
40435519a089SJose E. Roman */ 40445519a089SJose E. Roman B->nonzerostate++; 40453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4046273d9f13SBarry Smith } 4047273d9f13SBarry Smith 4048ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4049d71ae5a4SJacob Faibussowitsch { 4050846b4da1SFande Kong Mat_SeqAIJ *a; 4051a5bbaf83SFande Kong PetscInt i; 40521f14be2bSBarry Smith PetscBool skipreset; 4053846b4da1SFande Kong 4054846b4da1SFande Kong PetscFunctionBegin; 4055846b4da1SFande Kong PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 405614d0e64fSAlex Lindsay 405714d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 40583ba16761SJacob Faibussowitsch if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS); 405914d0e64fSAlex Lindsay 4060846b4da1SFande Kong a = (Mat_SeqAIJ *)A->data; 40612c814fdeSFande Kong /* if no saved info, we error out */ 406228b400f6SJacob Faibussowitsch PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info "); 40632c814fdeSFande Kong 40641f14be2bSBarry Smith PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation "); 40652c814fdeSFande Kong 40661f14be2bSBarry Smith PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset)); 40671f14be2bSBarry Smith if (!skipreset) { 40689566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n)); 40699566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen, A->rmap->n)); 4070846b4da1SFande Kong a->i[0] = 0; 4071ad540459SPierre Jolivet for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1]; 4072846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4073846b4da1SFande Kong a->nz = 0; 4074846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4075846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4076846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4077846b4da1SFande Kong A->assembled = 
PETSC_FALSE; 40781f14be2bSBarry Smith } 40793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4080846b4da1SFande Kong } 4081846b4da1SFande Kong 408258d36128SBarry Smith /*@ 408311a5261eSBarry Smith MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format. 4084a1661176SMatthew Knepley 4085a1661176SMatthew Knepley Input Parameters: 4086a1661176SMatthew Knepley + B - the matrix 4087a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4088a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4089a1661176SMatthew Knepley - v - optional values in the matrix 4090a1661176SMatthew Knepley 4091a1661176SMatthew Knepley Level: developer 4092a1661176SMatthew Knepley 40936a9b8d82SBarry Smith Notes: 40942ef1f0ffSBarry Smith The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()` 409558d36128SBarry Smith 40966a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 40976a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 40986a9b8d82SBarry Smith 40996a9b8d82SBarry Smith Developer Notes: 41002ef1f0ffSBarry Smith An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and 41012ef1f0ffSBarry Smith then just copies the `v` values directly with `PetscMemcpy()`. 41026a9b8d82SBarry Smith 410311a5261eSBarry Smith This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them. 
41046a9b8d82SBarry Smith 4105fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()` 4106a1661176SMatthew Knepley @*/ 4107d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 4108d71ae5a4SJacob Faibussowitsch { 4109a1661176SMatthew Knepley PetscFunctionBegin; 41100700a824SBarry Smith PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 41116ba663aaSJed Brown PetscValidType(B, 1); 4112cac4c232SBarry Smith PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v)); 41133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4114a1661176SMatthew Knepley } 4115a1661176SMatthew Knepley 4116ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[]) 4117d71ae5a4SJacob Faibussowitsch { 4118a1661176SMatthew Knepley PetscInt i; 4119a1661176SMatthew Knepley PetscInt m, n; 4120a1661176SMatthew Knepley PetscInt nz; 41216a9b8d82SBarry Smith PetscInt *nnz; 4122a1661176SMatthew Knepley 4123a1661176SMatthew Knepley PetscFunctionBegin; 4124aed4548fSBarry Smith PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4125779a8d59SSatish Balay 41269566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41279566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4128779a8d59SSatish Balay 41299566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41309566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 4131a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4132b7940d39SSatish Balay nz = Ii[i + 1] - Ii[i]; 413308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, 
"Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 4134a1661176SMatthew Knepley nnz[i] = nz; 4135a1661176SMatthew Knepley } 41369566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41379566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4138a1661176SMatthew Knepley 4139*8e3a54c0SPierre Jolivet for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES)); 4140a1661176SMatthew Knepley 41419566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 41429566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 4143a1661176SMatthew Knepley 41449566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 41453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4146a1661176SMatthew Knepley } 4147a1661176SMatthew Knepley 4148ad7e164aSPierre Jolivet /*@ 41492ef1f0ffSBarry Smith MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`. 4150ad7e164aSPierre Jolivet 4151ad7e164aSPierre Jolivet Input Parameters: 4152ad7e164aSPierre Jolivet + A - left-hand side matrix 4153ad7e164aSPierre Jolivet . B - right-hand side matrix 415411a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX` 4155ad7e164aSPierre Jolivet 4156ad7e164aSPierre Jolivet Output Parameter: 41572ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B` 4158ad7e164aSPierre Jolivet 4159ad7e164aSPierre Jolivet Level: intermediate 4160ad7e164aSPierre Jolivet 416111a5261eSBarry Smith Note: 416211a5261eSBarry Smith `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`. 
4163ad7e164aSPierre Jolivet 41641cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse` 4165ad7e164aSPierre Jolivet @*/ 4166d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C) 4167d71ae5a4SJacob Faibussowitsch { 4168ad7e164aSPierre Jolivet PetscFunctionBegin; 4169ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A, MAT_CLASSID, 1); 4170ad7e164aSPierre Jolivet PetscValidType(A, 1); 4171ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B, MAT_CLASSID, 2); 4172ad7e164aSPierre Jolivet PetscValidType(B, 2); 41734f572ea9SToby Isaac PetscAssertPointer(C, 4); 4174ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4175ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C, MAT_CLASSID, 4); 4176ad7e164aSPierre Jolivet PetscValidType(*C, 4); 4177ad7e164aSPierre Jolivet } 4178cac4c232SBarry Smith PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C)); 41793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4180ad7e164aSPierre Jolivet } 4181ad7e164aSPierre Jolivet 4182ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C) 4183d71ae5a4SJacob Faibussowitsch { 4184ad7e164aSPierre Jolivet Mat newmat; 4185ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 4186ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ *)B->data; 4187ad7e164aSPierre Jolivet PetscScalar *v; 4188fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 4189ad7e164aSPierre Jolivet PetscInt *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n; 4190ad7e164aSPierre Jolivet PetscBool flg; 4191ad7e164aSPierre Jolivet 4192ad7e164aSPierre Jolivet PetscFunctionBegin; 419328b400f6SJacob Faibussowitsch PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 419428b400f6SJacob Faibussowitsch PetscCheck(A->assembled, PETSC_COMM_SELF, 
PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 419528b400f6SJacob Faibussowitsch PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix"); 419628b400f6SJacob Faibussowitsch PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix"); 41979566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg)); 419828b400f6SJacob Faibussowitsch PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name); 4199aed4548fSBarry Smith PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse); 4200ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42019566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j)); 42029566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF, &newmat)); 42039566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn)); 42049566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat, MATAIJ)); 4205ad7e164aSPierre Jolivet i[0] = 0; 4206ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4207ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4208ad7e164aSPierre Jolivet i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]); 4209ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4210ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q]; 4211ad7e164aSPierre Jolivet } 4212ad7e164aSPierre Jolivet } 4213ad7e164aSPierre Jolivet } 42149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL)); 4215ad7e164aSPierre Jolivet *C = newmat; 42169566063dSJacob Faibussowitsch PetscCall(PetscFree2(i, j)); 4217ad7e164aSPierre Jolivet nnz = 0; 4218ad7e164aSPierre Jolivet } 42199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C, &v)); 
42209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 42219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 4222ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4223ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4224ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m + 1]; ++n) { 4225ad540459SPierre Jolivet for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q]; 4226ad7e164aSPierre Jolivet } 4227ad7e164aSPierre Jolivet } 4228ad7e164aSPierre Jolivet } 42299566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C, &v)); 42309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 42319566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 42323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4233ad7e164aSPierre Jolivet } 4234ad7e164aSPierre Jolivet 4235c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4236af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4237170fe5c8SBarry Smith 4238170fe5c8SBarry Smith /* 4239170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4240170fe5c8SBarry Smith 4241170fe5c8SBarry Smith n p p 42422da392ccSBarry Smith [ ] [ ] [ ] 42432da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42442da392ccSBarry Smith [ ] [ ] [ ] 4245170fe5c8SBarry Smith 4246170fe5c8SBarry Smith */ 4247d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C) 4248d71ae5a4SJacob Faibussowitsch { 4249170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense *)A->data; 4250170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ *)B->data; 4251170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense *)C->data; 425286214ceeSStefano Zampini PetscInt i, j, n, m, q, p; 4253170fe5c8SBarry Smith const PetscInt *ii, *idx; 4254170fe5c8SBarry Smith const PetscScalar *b, *a, *a_q; 4255170fe5c8SBarry Smith PetscScalar *c, *c_q; 425686214ceeSStefano Zampini PetscInt clda 
= sub_c->lda; 425786214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4258170fe5c8SBarry Smith 4259170fe5c8SBarry Smith PetscFunctionBegin; 4260d0f46423SBarry Smith m = A->rmap->n; 4261d0f46423SBarry Smith n = A->cmap->n; 4262d0f46423SBarry Smith p = B->cmap->n; 4263170fe5c8SBarry Smith a = sub_a->v; 4264170fe5c8SBarry Smith b = sub_b->a; 4265170fe5c8SBarry Smith c = sub_c->v; 426686214ceeSStefano Zampini if (clda == m) { 42679566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c, m * p)); 426886214ceeSStefano Zampini } else { 426986214ceeSStefano Zampini for (j = 0; j < p; j++) 42709371c9d4SSatish Balay for (i = 0; i < m; i++) c[j * clda + i] = 0.0; 427186214ceeSStefano Zampini } 4272170fe5c8SBarry Smith ii = sub_b->i; 4273170fe5c8SBarry Smith idx = sub_b->j; 4274170fe5c8SBarry Smith for (i = 0; i < n; i++) { 4275170fe5c8SBarry Smith q = ii[i + 1] - ii[i]; 4276170fe5c8SBarry Smith while (q-- > 0) { 427786214ceeSStefano Zampini c_q = c + clda * (*idx); 427886214ceeSStefano Zampini a_q = a + alda * i; 4279854c7f52SBarry Smith PetscKernelAXPY(c_q, *b, a_q, m); 4280170fe5c8SBarry Smith idx++; 4281170fe5c8SBarry Smith b++; 4282170fe5c8SBarry Smith } 4283170fe5c8SBarry Smith } 42843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4285170fe5c8SBarry Smith } 4286170fe5c8SBarry Smith 4287d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C) 4288d71ae5a4SJacob Faibussowitsch { 4289d0f46423SBarry Smith PetscInt m = A->rmap->n, n = B->cmap->n; 429086214ceeSStefano Zampini PetscBool cisdense; 4291170fe5c8SBarry Smith 4292170fe5c8SBarry Smith PetscFunctionBegin; 429308401ef6SPierre Jolivet PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n); 42949566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, m, n, m, n)); 42959566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, B)); 
4296d5e393b6SSuyash Tandon PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, "")); 429748a46eb9SPierre Jolivet if (!cisdense) PetscCall(MatSetType(C, MATDENSE)); 42989566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4299d73949e8SHong Zhang 43004222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 43013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4302170fe5c8SBarry Smith } 4303170fe5c8SBarry Smith 43040bad9183SKris Buschelman /*MC 4305fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43060bad9183SKris Buschelman based on compressed sparse row format. 43070bad9183SKris Buschelman 43082ef1f0ffSBarry Smith Options Database Key: 43090bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43100bad9183SKris Buschelman 43110bad9183SKris Buschelman Level: beginner 43120bad9183SKris Buschelman 43130cd7f59aSBarry Smith Notes: 43142ef1f0ffSBarry Smith `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values, 43150cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43160cd7f59aSBarry Smith in the matrix 43170cd7f59aSBarry Smith 431811a5261eSBarry Smith `MatSetOptions`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. 
In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored

   Developer Note:
    It would be nice if all matrix formats supported passing `NULL` in for the numerical values

.seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
   and `MATMPIAIJ` otherwise. As a result, for single process communicators,
   `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes. It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Key:
. -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`

   Level: beginner

   Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, and `MATAIJCRL`. This type also automatically switches over to use inodes when
   enough exist.
4344ccd284c7SBarry Smith 43451cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL` 4346ccd284c7SBarry Smith M*/ 4347ccd284c7SBarry Smith 4348ccd284c7SBarry Smith /*MC 4349ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4350ccd284c7SBarry Smith 43512ef1f0ffSBarry Smith Options Database Key: 43522ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()` 43532ef1f0ffSBarry Smith 43542ef1f0ffSBarry Smith Level: beginner 43552ef1f0ffSBarry Smith 43562ef1f0ffSBarry Smith Note: 435711a5261eSBarry Smith This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator, 435811a5261eSBarry Smith and `MATMPIAIJCRL` otherwise. As a result, for single process communicators, 435911a5261eSBarry Smith `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported 4360ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4361ccd284c7SBarry Smith the above preallocation routines for simplicity. 4362ccd284c7SBarry Smith 43631cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL` 4364ccd284c7SBarry Smith M*/ 4365ccd284c7SBarry Smith 43667906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *); 43677906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43687906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 43697906f579SHong Zhang #endif 4370d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4371d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 4372d24d4204SJose E. 
Roman #endif 43737906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 43747906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *); 43757906f579SHong Zhang #endif 43767906f579SHong Zhang 4377d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *); 4378c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *); 43794222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 43807906f579SHong Zhang 43818c778c55SBarry Smith /*@C 438211a5261eSBarry Smith MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored 43838c778c55SBarry Smith 43848c778c55SBarry Smith Not Collective 43858c778c55SBarry Smith 43868c778c55SBarry Smith Input Parameter: 4387fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 43888c778c55SBarry Smith 43898c778c55SBarry Smith Output Parameter: 43908c778c55SBarry Smith . 
array - pointer to the data 43918c778c55SBarry Smith 43928c778c55SBarry Smith Level: intermediate 43938c778c55SBarry Smith 4394fe59aa6dSJacob Faibussowitsch Fortran Notes: 43950ab4885dSBarry Smith `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()` 43960ab4885dSBarry Smith 43971cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 43988c778c55SBarry Smith @*/ 4399d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array) 4400d71ae5a4SJacob Faibussowitsch { 4401d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44028c778c55SBarry Smith 44038c778c55SBarry Smith PetscFunctionBegin; 4404d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44059566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A, array)); 4406d67d9f35SJunchao Zhang } else { 4407d67d9f35SJunchao Zhang *array = aij->a; 4408d67d9f35SJunchao Zhang } 44093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4410d67d9f35SJunchao Zhang } 4411d67d9f35SJunchao Zhang 4412d67d9f35SJunchao Zhang /*@C 441311a5261eSBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()` 4414d67d9f35SJunchao Zhang 4415d67d9f35SJunchao Zhang Not Collective 4416d67d9f35SJunchao Zhang 4417d67d9f35SJunchao Zhang Input Parameters: 4418fe59aa6dSJacob Faibussowitsch + A - a `MATSEQAIJ` matrix 4419d67d9f35SJunchao Zhang - array - pointer to the data 4420d67d9f35SJunchao Zhang 4421d67d9f35SJunchao Zhang Level: intermediate 4422d67d9f35SJunchao Zhang 4423fe59aa6dSJacob Faibussowitsch Fortran Notes: 44240ab4885dSBarry Smith `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()` 44250ab4885dSBarry Smith 44261cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()` 4427d67d9f35SJunchao Zhang 
@*/ 4428d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array) 4429d71ae5a4SJacob Faibussowitsch { 4430d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4431d67d9f35SJunchao Zhang 4432d67d9f35SJunchao Zhang PetscFunctionBegin; 4433d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44349566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A, array)); 4435d67d9f35SJunchao Zhang } else { 4436d67d9f35SJunchao Zhang *array = NULL; 4437d67d9f35SJunchao Zhang } 44389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44399566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44418c778c55SBarry Smith } 44428c778c55SBarry Smith 444321e72a00SBarry Smith /*@C 444411a5261eSBarry Smith MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored 44458f1ea47aSStefano Zampini 44460ab4885dSBarry Smith Not Collective; No Fortran Support 44478f1ea47aSStefano Zampini 44488f1ea47aSStefano Zampini Input Parameter: 4449fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44508f1ea47aSStefano Zampini 44518f1ea47aSStefano Zampini Output Parameter: 44528f1ea47aSStefano Zampini . 
array - pointer to the data 44538f1ea47aSStefano Zampini 44548f1ea47aSStefano Zampini Level: intermediate 44558f1ea47aSStefano Zampini 44561cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 44578f1ea47aSStefano Zampini @*/ 4458d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array) 4459d71ae5a4SJacob Faibussowitsch { 4460d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44618f1ea47aSStefano Zampini 44628f1ea47aSStefano Zampini PetscFunctionBegin; 4463d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44649566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A, array)); 4465d67d9f35SJunchao Zhang } else { 4466d67d9f35SJunchao Zhang *array = aij->a; 4467d67d9f35SJunchao Zhang } 44683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44698f1ea47aSStefano Zampini } 44708f1ea47aSStefano Zampini 44718f1ea47aSStefano Zampini /*@C 447211a5261eSBarry Smith MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()` 44738f1ea47aSStefano Zampini 44740ab4885dSBarry Smith Not Collective; No Fortran Support 44758f1ea47aSStefano Zampini 44768f1ea47aSStefano Zampini Input Parameter: 4477fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 44788f1ea47aSStefano Zampini 44798f1ea47aSStefano Zampini Output Parameter: 44808f1ea47aSStefano Zampini . 
array - pointer to the data 44818f1ea47aSStefano Zampini 44828f1ea47aSStefano Zampini Level: intermediate 44838f1ea47aSStefano Zampini 44841cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 44858f1ea47aSStefano Zampini @*/ 4486d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array) 4487d71ae5a4SJacob Faibussowitsch { 4488d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 44898f1ea47aSStefano Zampini 44908f1ea47aSStefano Zampini PetscFunctionBegin; 4491d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 44929566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A, array)); 4493d67d9f35SJunchao Zhang } else { 4494d67d9f35SJunchao Zhang *array = NULL; 4495d67d9f35SJunchao Zhang } 44963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4497d67d9f35SJunchao Zhang } 4498d67d9f35SJunchao Zhang 4499d67d9f35SJunchao Zhang /*@C 450011a5261eSBarry Smith MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored 4501d67d9f35SJunchao Zhang 45020ab4885dSBarry Smith Not Collective; No Fortran Support 4503d67d9f35SJunchao Zhang 4504d67d9f35SJunchao Zhang Input Parameter: 4505fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 4506d67d9f35SJunchao Zhang 4507d67d9f35SJunchao Zhang Output Parameter: 4508d67d9f35SJunchao Zhang . 
array - pointer to the data 4509d67d9f35SJunchao Zhang 4510d67d9f35SJunchao Zhang Level: intermediate 4511d67d9f35SJunchao Zhang 45121cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()` 4513d67d9f35SJunchao Zhang @*/ 4514d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array) 4515d71ae5a4SJacob Faibussowitsch { 4516d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4517d67d9f35SJunchao Zhang 4518d67d9f35SJunchao Zhang PetscFunctionBegin; 4519d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45209566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A, array)); 4521d67d9f35SJunchao Zhang } else { 4522d67d9f35SJunchao Zhang *array = aij->a; 4523d67d9f35SJunchao Zhang } 45249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45259566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 45263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4527d67d9f35SJunchao Zhang } 4528d67d9f35SJunchao Zhang 4529d67d9f35SJunchao Zhang /*@C 4530d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4531d67d9f35SJunchao Zhang 45320ab4885dSBarry Smith Not Collective; No Fortran Support 4533d67d9f35SJunchao Zhang 4534d67d9f35SJunchao Zhang Input Parameter: 4535fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix 4536d67d9f35SJunchao Zhang 4537d67d9f35SJunchao Zhang Output Parameter: 4538d67d9f35SJunchao Zhang . 
array - pointer to the data 4539d67d9f35SJunchao Zhang 4540d67d9f35SJunchao Zhang Level: intermediate 4541d67d9f35SJunchao Zhang 45421cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 4543d67d9f35SJunchao Zhang @*/ 4544d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array) 4545d71ae5a4SJacob Faibussowitsch { 4546d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 4547d67d9f35SJunchao Zhang 4548d67d9f35SJunchao Zhang PetscFunctionBegin; 4549d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45509566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A, array)); 4551d67d9f35SJunchao Zhang } else { 4552d67d9f35SJunchao Zhang *array = NULL; 4553d67d9f35SJunchao Zhang } 45543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45558f1ea47aSStefano Zampini } 45568f1ea47aSStefano Zampini 45578f1ea47aSStefano Zampini /*@C 455811a5261eSBarry Smith MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix 45597ee59b9bSJunchao Zhang 45600ab4885dSBarry Smith Not Collective; No Fortran Support 45617ee59b9bSJunchao Zhang 45627ee59b9bSJunchao Zhang Input Parameter: 456311a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses 45647ee59b9bSJunchao Zhang 45657ee59b9bSJunchao Zhang Output Parameters: 45667ee59b9bSJunchao Zhang + i - row map array of the matrix 45677ee59b9bSJunchao Zhang . j - column index array of the matrix 45687ee59b9bSJunchao Zhang . a - data array of the matrix 4569fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays 45707ee59b9bSJunchao Zhang 4571fe59aa6dSJacob Faibussowitsch Level: developer 45722ef1f0ffSBarry Smith 45737ee59b9bSJunchao Zhang Notes: 45742ef1f0ffSBarry Smith Any of the output parameters can be `NULL`, in which case the corresponding value is not returned. 45757ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. 
Otherwise, they are on the host. 45767ee59b9bSJunchao Zhang 45777ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45782ef1f0ffSBarry Smith If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix. 45797ee59b9bSJunchao Zhang 45801cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()` 45817ee59b9bSJunchao Zhang @*/ 4582d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype) 4583d71ae5a4SJacob Faibussowitsch { 45847ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data; 45857ee59b9bSJunchao Zhang 45867ee59b9bSJunchao Zhang PetscFunctionBegin; 45877ee59b9bSJunchao Zhang PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated"); 45887ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 45897ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype)); 45907ee59b9bSJunchao Zhang } else { 45917ee59b9bSJunchao Zhang if (i) *i = aij->i; 45927ee59b9bSJunchao Zhang if (j) *j = aij->j; 45937ee59b9bSJunchao Zhang if (a) *a = aij->a; 45947ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 45957ee59b9bSJunchao Zhang } 45963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45977ee59b9bSJunchao Zhang } 45987ee59b9bSJunchao Zhang 45997ee59b9bSJunchao Zhang /*@C 460021e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 460121e72a00SBarry Smith 460221e72a00SBarry Smith Not Collective 460321e72a00SBarry Smith 460421e72a00SBarry Smith Input Parameter: 4605fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix 460621e72a00SBarry Smith 460721e72a00SBarry Smith Output Parameter: 460821e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 460921e72a00SBarry Smith 461021e72a00SBarry Smith Level: intermediate 461121e72a00SBarry Smith 46121cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()` 461321e72a00SBarry Smith @*/ 4614d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz) 4615d71ae5a4SJacob Faibussowitsch { 461621e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data; 461721e72a00SBarry Smith 461821e72a00SBarry Smith PetscFunctionBegin; 461921e72a00SBarry Smith *nz = aij->rmax; 46203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 462121e72a00SBarry Smith } 462221e72a00SBarry Smith 46232c4ab24aSJunchao Zhang static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void *data) 46242c4ab24aSJunchao Zhang { 46252c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)data; 46262c4ab24aSJunchao Zhang PetscFunctionBegin; 46272c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->perm)); 46282c4ab24aSJunchao Zhang PetscCall(PetscFree(coo->jmap)); 46292c4ab24aSJunchao Zhang PetscCall(PetscFree(coo)); 46302c4ab24aSJunchao Zhang PetscFunctionReturn(PETSC_SUCCESS); 46312c4ab24aSJunchao Zhang } 46322c4ab24aSJunchao Zhang 4633d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[]) 4634d71ae5a4SJacob Faibussowitsch { 4635394ed5ebSJunchao Zhang MPI_Comm comm; 4636394ed5ebSJunchao Zhang PetscInt *i, *j; 4637394ed5ebSJunchao Zhang PetscInt M, N, row; 4638394ed5ebSJunchao Zhang PetscCount k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */ 4639394ed5ebSJunchao Zhang PetscInt *Ai; /* Change to PetscCount once we use it for row pointers */ 4640394ed5ebSJunchao Zhang PetscInt *Aj; 4641394ed5ebSJunchao Zhang PetscScalar *Aa; 4642cbc6b225SStefano Zampini Mat_SeqAIJ *seqaij = (Mat_SeqAIJ *)(mat->data); 4643cbc6b225SStefano Zampini MatType 
rtype; 4644394ed5ebSJunchao Zhang PetscCount *perm, *jmap; 46452c4ab24aSJunchao Zhang PetscContainer container; 46462c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 4647394ed5ebSJunchao Zhang 4648394ed5ebSJunchao Zhang PetscFunctionBegin; 46499566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)mat, &comm)); 46509566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &M, &N)); 4651e8729f6fSJunchao Zhang i = coo_i; 4652e8729f6fSJunchao Zhang j = coo_j; 46539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n, &perm)); 4654394ed5ebSJunchao Zhang for (k = 0; k < coo_n; k++) { /* Ignore entries with negative row or col indices */ 4655394ed5ebSJunchao Zhang if (j[k] < 0) i[k] = -1; 4656394ed5ebSJunchao Zhang perm[k] = k; 4657394ed5ebSJunchao Zhang } 4658394ed5ebSJunchao Zhang 4659394ed5ebSJunchao Zhang /* Sort by row */ 46609566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm)); 4661651b1cf9SStefano Zampini 4662651b1cf9SStefano Zampini /* Advance k to the first row with a non-negative index */ 4663651b1cf9SStefano Zampini for (k = 0; k < coo_n; k++) 46649371c9d4SSatish Balay if (i[k] >= 0) break; 4665394ed5ebSJunchao Zhang nneg = k; 46669566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. 
jmap[i] originally is the number of repeats for i-th nonzero */ 4667394ed5ebSJunchao Zhang nnz = 0; /* Total number of unique nonzeros to be counted */ 466835cb6cd3SPierre Jolivet jmap++; /* Inc jmap by 1 for convenience */ 4669394ed5ebSJunchao Zhang 46709566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(M + 1, &Ai)); /* CSR of A */ 46719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */ 4672394ed5ebSJunchao Zhang 4673651b1cf9SStefano Zampini /* Support for HYPRE */ 4674651b1cf9SStefano Zampini PetscBool hypre; 4675651b1cf9SStefano Zampini const char *name; 4676651b1cf9SStefano Zampini PetscCall(PetscObjectGetName((PetscObject)mat, &name)); 4677651b1cf9SStefano Zampini PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre)); 4678651b1cf9SStefano Zampini 4679394ed5ebSJunchao Zhang /* In each row, sort by column, then unique column indices to get row length */ 468035cb6cd3SPierre Jolivet Ai++; /* Inc by 1 for convenience */ 4681394ed5ebSJunchao Zhang q = 0; /* q-th unique nonzero, with q starting from 0 */ 4682394ed5ebSJunchao Zhang while (k < coo_n) { 4683394ed5ebSJunchao Zhang row = i[k]; 4684394ed5ebSJunchao Zhang start = k; /* [start,end) indices for this row */ 4685394ed5ebSJunchao Zhang while (k < coo_n && i[k] == row) k++; 4686394ed5ebSJunchao Zhang end = k; 4687651b1cf9SStefano Zampini /* hack for HYPRE: swap min column to diag so that diagonal values will go first */ 4688651b1cf9SStefano Zampini if (hypre) { 4689651b1cf9SStefano Zampini PetscInt minj = PETSC_MAX_INT; 4690651b1cf9SStefano Zampini PetscBool hasdiag = PETSC_FALSE; 4691651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4692651b1cf9SStefano Zampini hasdiag = (PetscBool)(hasdiag || (j[p] == row)); 4693651b1cf9SStefano Zampini minj = PetscMin(minj, j[p]); 4694651b1cf9SStefano Zampini } 4695651b1cf9SStefano Zampini if (hasdiag) { 4696651b1cf9SStefano Zampini for (p = start; p < end; p++) { 4697651b1cf9SStefano 
Zampini if (j[p] == minj) j[p] = row; 4698651b1cf9SStefano Zampini else if (j[p] == row) j[p] = minj; 4699651b1cf9SStefano Zampini } 4700651b1cf9SStefano Zampini } 4701651b1cf9SStefano Zampini } 47029566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start)); 4703651b1cf9SStefano Zampini 4704394ed5ebSJunchao Zhang /* Find number of unique col entries in this row */ 4705394ed5ebSJunchao Zhang Aj[q] = j[start]; /* Log the first nonzero in this row */ 4706651b1cf9SStefano Zampini jmap[q] = 1; /* Number of repeats of this nonzero entry */ 4707394ed5ebSJunchao Zhang Ai[row] = 1; 4708394ed5ebSJunchao Zhang nnz++; 4709394ed5ebSJunchao Zhang 4710394ed5ebSJunchao Zhang for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */ 4711394ed5ebSJunchao Zhang if (j[p] != j[p - 1]) { /* Meet a new nonzero */ 4712394ed5ebSJunchao Zhang q++; 4713394ed5ebSJunchao Zhang jmap[q] = 1; 4714394ed5ebSJunchao Zhang Aj[q] = j[p]; 4715394ed5ebSJunchao Zhang Ai[row]++; 4716394ed5ebSJunchao Zhang nnz++; 4717394ed5ebSJunchao Zhang } else { 4718394ed5ebSJunchao Zhang jmap[q]++; 4719394ed5ebSJunchao Zhang } 4720394ed5ebSJunchao Zhang } 4721394ed5ebSJunchao Zhang q++; /* Move to next row and thus next unique nonzero */ 4722394ed5ebSJunchao Zhang } 4723394ed5ebSJunchao Zhang Ai--; /* Back to the beginning of Ai[] */ 4724394ed5ebSJunchao Zhang for (k = 0; k < M; k++) Ai[k + 1] += Ai[k]; 4725394ed5ebSJunchao Zhang jmap--; /* Back to the beginning of jmap[] */ 4726394ed5ebSJunchao Zhang jmap[0] = 0; 4727394ed5ebSJunchao Zhang for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k]; 4728394ed5ebSJunchao Zhang if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */ 4729394ed5ebSJunchao Zhang PetscCount *jmap_new; 4730394ed5ebSJunchao Zhang PetscInt *Aj_new; 4731394ed5ebSJunchao Zhang 47329566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz + 1, &jmap_new)); 47339566063dSJacob Faibussowitsch 
PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1)); 47349566063dSJacob Faibussowitsch PetscCall(PetscFree(jmap)); 4735394ed5ebSJunchao Zhang jmap = jmap_new; 4736394ed5ebSJunchao Zhang 47379566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nnz, &Aj_new)); 47389566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(Aj_new, Aj, nnz)); 47399566063dSJacob Faibussowitsch PetscCall(PetscFree(Aj)); 4740394ed5ebSJunchao Zhang Aj = Aj_new; 4741394ed5ebSJunchao Zhang } 4742394ed5ebSJunchao Zhang 4743394ed5ebSJunchao Zhang if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */ 4744394ed5ebSJunchao Zhang PetscCount *perm_new; 4745cbc6b225SStefano Zampini 47469566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(coo_n - nneg, &perm_new)); 47479566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg)); 47489566063dSJacob Faibussowitsch PetscCall(PetscFree(perm)); 4749394ed5ebSJunchao Zhang perm = perm_new; 4750394ed5ebSJunchao Zhang } 4751394ed5ebSJunchao Zhang 47529566063dSJacob Faibussowitsch PetscCall(MatGetRootType_Private(mat, &rtype)); 47539566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */ 47549566063dSJacob Faibussowitsch PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat)); 4755394ed5ebSJunchao Zhang 4756394ed5ebSJunchao Zhang seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */ 4757394ed5ebSJunchao Zhang seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */ 47582c4ab24aSJunchao Zhang 47592c4ab24aSJunchao Zhang // Put the COO struct in a container and then attach that to the matrix 47602c4ab24aSJunchao Zhang PetscCall(PetscMalloc1(1, &coo)); 47612c4ab24aSJunchao Zhang coo->nz = nnz; 47622c4ab24aSJunchao Zhang coo->n = coo_n; 47632c4ab24aSJunchao Zhang coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again 
47642c4ab24aSJunchao Zhang coo->jmap = jmap; // of length nnz+1 47652c4ab24aSJunchao Zhang coo->perm = perm; 47662c4ab24aSJunchao Zhang PetscCall(PetscContainerCreate(PETSC_COMM_SELF, &container)); 47672c4ab24aSJunchao Zhang PetscCall(PetscContainerSetPointer(container, coo)); 47682c4ab24aSJunchao Zhang PetscCall(PetscContainerSetUserDestroy(container, MatCOOStructDestroy_SeqAIJ)); 47692c4ab24aSJunchao Zhang PetscCall(PetscObjectCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", (PetscObject)container)); 47702c4ab24aSJunchao Zhang PetscCall(PetscContainerDestroy(&container)); 47713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4772394ed5ebSJunchao Zhang } 4773394ed5ebSJunchao Zhang 4774d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode) 4775d71ae5a4SJacob Faibussowitsch { 4776394ed5ebSJunchao Zhang Mat_SeqAIJ *aseq = (Mat_SeqAIJ *)A->data; 4777394ed5ebSJunchao Zhang PetscCount i, j, Annz = aseq->nz; 47782c4ab24aSJunchao Zhang PetscCount *perm, *jmap; 4779394ed5ebSJunchao Zhang PetscScalar *Aa; 47802c4ab24aSJunchao Zhang PetscContainer container; 47812c4ab24aSJunchao Zhang MatCOOStruct_SeqAIJ *coo; 4782394ed5ebSJunchao Zhang 4783394ed5ebSJunchao Zhang PetscFunctionBegin; 47842c4ab24aSJunchao Zhang PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container)); 47852c4ab24aSJunchao Zhang PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix"); 47862c4ab24aSJunchao Zhang PetscCall(PetscContainerGetPointer(container, (void **)&coo)); 47872c4ab24aSJunchao Zhang perm = coo->perm; 47882c4ab24aSJunchao Zhang jmap = coo->jmap; 47899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A, &Aa)); 4790394ed5ebSJunchao Zhang for (i = 0; i < Annz; i++) { 4791b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4792b6c38306SJunchao Zhang for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]]; 4793b6c38306SJunchao 
Zhang Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum; 4794394ed5ebSJunchao Zhang } 47959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A, &Aa)); 47963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4797394ed5ebSJunchao Zhang } 4798394ed5ebSJunchao Zhang 479934b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48005063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *); 480102fe1965SBarry Smith #endif 4802d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4803d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *); 4804d5e393b6SSuyash Tandon #endif 48053d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48065063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *); 48073d0639e7SStefano Zampini #endif 480802fe1965SBarry Smith 4809d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4810d71ae5a4SJacob Faibussowitsch { 4811273d9f13SBarry Smith Mat_SeqAIJ *b; 481238baddfdSBarry Smith PetscMPIInt size; 4813273d9f13SBarry Smith 4814273d9f13SBarry Smith PetscFunctionBegin; 48159566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 481608401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1"); 4817273d9f13SBarry Smith 48184dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 48192205254eSKarl Rupp 4820b0a32e0cSBarry Smith B->data = (void *)b; 4821aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 4822071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 48232205254eSKarl Rupp 4824f4259b30SLisandro Dalcin b->row = NULL; 4825f4259b30SLisandro Dalcin b->col = NULL; 4826f4259b30SLisandro Dalcin b->icol = NULL; 4827b810aeb4SBarry Smith b->reallocs = 0; 482836db0b34SBarry Smith 
b->ignorezeroentries = PETSC_FALSE; 4829f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4830416022c9SBarry Smith b->nonew = 0; 4831f4259b30SLisandro Dalcin b->diag = NULL; 4832f4259b30SLisandro Dalcin b->solve_work = NULL; 4833f4259b30SLisandro Dalcin B->spptr = NULL; 4834f4259b30SLisandro Dalcin b->saved_values = NULL; 4835f4259b30SLisandro Dalcin b->idiag = NULL; 4836f4259b30SLisandro Dalcin b->mdiag = NULL; 4837f4259b30SLisandro Dalcin b->ssor_work = NULL; 483871f1c65dSBarry Smith b->omega = 1.0; 483971f1c65dSBarry Smith b->fshift = 0.0; 484071f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4841bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4842a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 484317ab2063SBarry Smith 48449566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 4845d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB) 48469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ)); 48479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ)); 4848b3866ffcSBarry Smith #endif 48499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ)); 48509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ)); 48519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ)); 48529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ)); 48539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ)); 48549566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM)); 48559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL)); 48569779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 48579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL)); 4858191b95cbSRichard Tran Mills #endif 485934b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 48619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 48629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ)); 486302fe1965SBarry Smith #endif 4864d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 4865d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 4866d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 4867d5e393b6SSuyash Tandon PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ)); 4868d5e393b6SSuyash Tandon #endif 48693d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos)); 48713d0639e7SStefano Zampini #endif 48729566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL)); 4873af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 48749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental)); 4875af8000cdSHong Zhang #endif 4876d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 48779566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK)); 4878d24d4204SJose E. Roman #endif 487963c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 48809566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE)); 48819566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ)); 488263c07aadSStefano Zampini #endif 48839566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense)); 48849566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL)); 48859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS)); 48869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ)); 48879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ)); 48889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ)); 48899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", 
MatResetPreallocation_SeqAIJ)); 48909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ)); 48919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ)); 48929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ)); 48939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ)); 48949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ)); 48959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ)); 48969566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ)); 48979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ)); 48989566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 48999566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ)); 49009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 49013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 490217ab2063SBarry Smith } 490317ab2063SBarry Smith 4904b24902e0SBarry Smith /* 49053893b582SJunchao Zhang Given a matrix generated with MatGetFactor() duplicates all the information in A into C 4906b24902e0SBarry Smith */ 4907d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, 
PetscBool mallocmatspace) 4908d71ae5a4SJacob Faibussowitsch { 49092a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data; 4910071fcb05SBarry Smith PetscInt m = A->rmap->n, i; 491117ab2063SBarry Smith 49123a40ed3dSBarry Smith PetscFunctionBegin; 4913aed4548fSBarry Smith PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 4914273d9f13SBarry Smith 4915d5f3da31SBarry Smith C->factortype = A->factortype; 4916f4259b30SLisandro Dalcin c->row = NULL; 4917f4259b30SLisandro Dalcin c->col = NULL; 4918f4259b30SLisandro Dalcin c->icol = NULL; 49196ad4291fSHong Zhang c->reallocs = 0; 4920bc43efbbSJunchao Zhang c->diagonaldense = a->diagonaldense; 492117ab2063SBarry Smith 492269272f91SPierre Jolivet C->assembled = A->assembled; 492317ab2063SBarry Smith 492469272f91SPierre Jolivet if (A->preallocated) { 49259566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 49269566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 4927eec197d1SBarry Smith 492831fe6a7dSBarry Smith if (!A->hash_active) { 49299566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->imax)); 49309566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt))); 49319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &c->ilen)); 49329566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt))); 493317ab2063SBarry Smith 493417ab2063SBarry Smith /* allocate the matrix space */ 4935f77e22a1SHong Zhang if (mallocmatspace) { 49369566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i)); 49372205254eSKarl Rupp 4938f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 49392205254eSKarl Rupp 49409566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, m + 1)); 494117ab2063SBarry Smith if (m > 0) { 49429566063dSJacob Faibussowitsch 
PetscCall(PetscArraycpy(c->j, a->j, a->i[m])); 4943be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 49442e5835c6SStefano Zampini const PetscScalar *aa; 49452e5835c6SStefano Zampini 49469566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 49479566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, aa, a->i[m])); 49489566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 4949be6bf707SBarry Smith } else { 49509566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, a->i[m])); 495117ab2063SBarry Smith } 495208480c60SBarry Smith } 4953f77e22a1SHong Zhang } 495431fe6a7dSBarry Smith C->preallocated = PETSC_TRUE; 495531fe6a7dSBarry Smith } else { 495631fe6a7dSBarry Smith PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix"); 495731fe6a7dSBarry Smith PetscCall(MatSetUp(C)); 495831fe6a7dSBarry Smith } 495917ab2063SBarry Smith 49606ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4961416022c9SBarry Smith c->roworiented = a->roworiented; 4962416022c9SBarry Smith c->nonew = a->nonew; 4963416022c9SBarry Smith if (a->diag) { 49649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &c->diag)); 49659566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt))); 4966071fcb05SBarry Smith } else c->diag = NULL; 49672205254eSKarl Rupp 4968f4259b30SLisandro Dalcin c->solve_work = NULL; 4969f4259b30SLisandro Dalcin c->saved_values = NULL; 4970f4259b30SLisandro Dalcin c->idiag = NULL; 4971f4259b30SLisandro Dalcin c->ssor_work = NULL; 4972a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4973e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4974e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 49756ad4291fSHong Zhang 4976893ad86cSHong Zhang c->rmax = a->rmax; 4977416022c9SBarry Smith c->nz = a->nz; 49788ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right 
amount */ 4979754ec7b1SSatish Balay 49806ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 49816ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4982cd6b891eSBarry Smith if (a->compressedrow.use) { 49836ad4291fSHong Zhang i = a->compressedrow.nrows; 49849566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex)); 49859566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1)); 49869566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i)); 498727ea64f8SHong Zhang } else { 498827ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 49890298fd71SBarry Smith c->compressedrow.i = NULL; 49900298fd71SBarry Smith c->compressedrow.rindex = NULL; 49916ad4291fSHong Zhang } 4992ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4993e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 49944846f1f5SKris Buschelman 49959566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C)); 499669272f91SPierre Jolivet } 49979566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 49983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 499917ab2063SBarry Smith } 500017ab2063SBarry Smith 5001d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 5002d71ae5a4SJacob Faibussowitsch { 5003b24902e0SBarry Smith PetscFunctionBegin; 50049566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 50059566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n)); 500648a46eb9SPierre Jolivet if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A)); 50079566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, ((PetscObject)A)->type_name)); 
50089566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE)); 50093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5010b24902e0SBarry Smith } 5011b24902e0SBarry Smith 5012d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 5013d71ae5a4SJacob Faibussowitsch { 501452f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 501552f91c60SVaclav Hapla 501652f91c60SVaclav Hapla PetscFunctionBegin; 501752f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1); 501852f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2); 5019c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 50209566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 50219566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 50229566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5)); 502352f91c60SVaclav Hapla if (isbinary) { 50249566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer)); 502552f91c60SVaclav Hapla } else if (ishdf5) { 502652f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 50279566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat, viewer)); 502852f91c60SVaclav Hapla #else 502952f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 503052f91c60SVaclav Hapla #endif 503152f91c60SVaclav Hapla } else { 503298921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name); 503352f91c60SVaclav Hapla } 50343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 503552f91c60SVaclav Hapla } 503652f91c60SVaclav Hapla 
5037d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 5038d71ae5a4SJacob Faibussowitsch { 50393ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data; 50403ea6fe3dSLisandro Dalcin PetscInt header[4], *rowlens, M, N, nz, sum, rows, cols, i; 5041fbdbba38SShri Abhyankar 5042fbdbba38SShri Abhyankar PetscFunctionBegin; 50439566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 5044bbead8a2SBarry Smith 50453ea6fe3dSLisandro Dalcin /* read in matrix header */ 50469566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT)); 504708401ef6SPierre Jolivet PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file"); 50489371c9d4SSatish Balay M = header[1]; 50499371c9d4SSatish Balay N = header[2]; 50509371c9d4SSatish Balay nz = header[3]; 505108401ef6SPierre Jolivet PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M); 505208401ef6SPierre Jolivet PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N); 505308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ"); 5054fbdbba38SShri Abhyankar 50553ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 50569566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat, viewer)); 50573ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 50583ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 50593ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 50603ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 50613ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 50629566063dSJacob Faibussowitsch 
PetscCall(PetscLayoutSetUp(mat->rmap)); 50639566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 50643ea6fe3dSLisandro Dalcin 50653ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 50669566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5067aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50683ea6fe3dSLisandro Dalcin 5069fbdbba38SShri Abhyankar /* read in row lengths */ 50709566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M, &rowlens)); 50719566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT)); 50723ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 50739371c9d4SSatish Balay sum = 0; 50749371c9d4SSatish Balay for (i = 0; i < M; i++) sum += rowlens[i]; 507508401ef6SPierre Jolivet PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum); 50763ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 50779566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens)); 50789566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat, &rows, &cols)); 5079aed4548fSBarry Smith PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols); 50803ea6fe3dSLisandro Dalcin /* store row lengths */ 50819566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen, rowlens, M)); 50829566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5083fbdbba38SShri Abhyankar 50843ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50859371c9d4SSatish Balay 
a->i[0] = 0; 50869371c9d4SSatish Balay for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i]; 50873ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50889566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT)); 50893ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50909566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR)); 5091fbdbba38SShri Abhyankar 50929566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY)); 50939566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY)); 50943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5095fbdbba38SShri Abhyankar } 5096fbdbba38SShri Abhyankar 5097d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg) 5098d71ae5a4SJacob Faibussowitsch { 50997264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data; 5100fff043a9SJunchao Zhang const PetscScalar *aa, *ba; 5101eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5102eeffb40dSHong Zhang PetscInt k; 5103eeffb40dSHong Zhang #endif 51047264ac53SSatish Balay 51053a40ed3dSBarry Smith PetscFunctionBegin; 5106bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5107d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) { 5108ca44d042SBarry Smith *flg = PETSC_FALSE; 51093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5110bcd2baecSBarry Smith } 51117264ac53SSatish Balay 51127264ac53SSatish Balay /* if the a->i are the same */ 51139566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg)); 51143ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 51157264ac53SSatish Balay 51167264ac53SSatish Balay /* if a->j are the same */ 51179566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg)); 
51183ba16761SJacob Faibussowitsch if (!*flg) PetscFunctionReturn(PETSC_SUCCESS); 5119bcd2baecSBarry Smith 51209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A, &aa)); 51219566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B, &ba)); 5122bcd2baecSBarry Smith /* if a->a are the same */ 5123eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5124eeffb40dSHong Zhang for (k = 0; k < a->nz; k++) { 5125fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5126eeffb40dSHong Zhang *flg = PETSC_FALSE; 51273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5128eeffb40dSHong Zhang } 5129eeffb40dSHong Zhang } 5130eeffb40dSHong Zhang #else 51319566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa, ba, a->nz, flg)); 5132eeffb40dSHong Zhang #endif 51339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A, &aa)); 51349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B, &ba)); 51353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51367264ac53SSatish Balay } 513736db0b34SBarry Smith 513805869f15SSatish Balay /*@ 513911a5261eSBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format) 514036db0b34SBarry Smith provided by the user. 514136db0b34SBarry Smith 5142d083f849SBarry Smith Collective 514336db0b34SBarry Smith 514436db0b34SBarry Smith Input Parameters: 514536db0b34SBarry Smith + comm - must be an MPI communicator of size 1 514636db0b34SBarry Smith . m - number of rows 514736db0b34SBarry Smith . n - number of columns 5148483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 514936db0b34SBarry Smith . j - column indices 515036db0b34SBarry Smith - a - matrix values 515136db0b34SBarry Smith 515236db0b34SBarry Smith Output Parameter: 515336db0b34SBarry Smith . 
mat - the matrix 515436db0b34SBarry Smith 515536db0b34SBarry Smith Level: intermediate 515636db0b34SBarry Smith 515736db0b34SBarry Smith Notes: 51582ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 5159292fb18eSBarry Smith once the matrix is destroyed and not before 516036db0b34SBarry Smith 516136db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 516236db0b34SBarry Smith 51632ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 516436db0b34SBarry Smith 5165a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5166a4552177SSatish Balay row-major ordering.. i.e for the following matrix, the input data expected is 51678eef79e4SBarry Smith as shown 51682ef1f0ffSBarry Smith .vb 51692ef1f0ffSBarry Smith 1 0 0 51702ef1f0ffSBarry Smith 2 0 3 51712ef1f0ffSBarry Smith 4 5 6 5172a4552177SSatish Balay 51732ef1f0ffSBarry Smith i = {0,1,3,6} [size = nrow+1 = 3+1] 51742ef1f0ffSBarry Smith j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 51752ef1f0ffSBarry Smith v = {1,2,3,4,5,6} [size = 6] 51762ef1f0ffSBarry Smith .ve 5177a4552177SSatish Balay 51781cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()` 517936db0b34SBarry Smith @*/ 5180d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 5181d71ae5a4SJacob Faibussowitsch { 5182cbcfb4deSHong Zhang PetscInt ii; 518336db0b34SBarry Smith Mat_SeqAIJ *aij; 5184cbcfb4deSHong Zhang PetscInt jj; 518536db0b34SBarry Smith 518636db0b34SBarry Smith PetscFunctionBegin; 5187aed4548fSBarry Smith PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 51889566063dSJacob Faibussowitsch 
PetscCall(MatCreate(comm, mat)); 51899566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 51909566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51919566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 51929566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL)); 5193ab93d7beSBarry Smith aij = (Mat_SeqAIJ *)(*mat)->data; 51949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->imax)); 51959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &aij->ilen)); 5196ab93d7beSBarry Smith 519736db0b34SBarry Smith aij->i = i; 519836db0b34SBarry Smith aij->j = j; 519936db0b34SBarry Smith aij->a = a; 520036db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 520136db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5202e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5203e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 520436db0b34SBarry Smith 5205cbc6b225SStefano Zampini for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) { 520636db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii]; 520776bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 5208aed4548fSBarry Smith PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 52099985e31cSBarry Smith for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) { 521008401ef6SPierre Jolivet PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii); 521108401ef6SPierre Jolivet PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " 
is identical to previous entry", jj - i[ii], j[jj], ii); 52129985e31cSBarry Smith } 521336db0b34SBarry Smith } 521476bd3646SJed Brown } 521576bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 521636db0b34SBarry Smith for (ii = 0; ii < aij->i[m]; ii++) { 521708401ef6SPierre Jolivet PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 5218aed4548fSBarry Smith PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 521936db0b34SBarry Smith } 522076bd3646SJed Brown } 522136db0b34SBarry Smith 52229566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52239566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 522536db0b34SBarry Smith } 5226cbc6b225SStefano Zampini 5227f62e3866SBarry Smith /*@ 522811a5261eSBarry Smith MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format) 52298a0b0e6bSVictor Minden provided by the user. 52308a0b0e6bSVictor Minden 5231d083f849SBarry Smith Collective 52328a0b0e6bSVictor Minden 52338a0b0e6bSVictor Minden Input Parameters: 52348a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 52358a0b0e6bSVictor Minden . m - number of rows 52368a0b0e6bSVictor Minden . n - number of columns 52378a0b0e6bSVictor Minden . i - row indices 52388a0b0e6bSVictor Minden . j - column indices 52391230e6d1SVictor Minden . a - matrix values 52401230e6d1SVictor Minden . nz - number of nonzeros 52412ef1f0ffSBarry Smith - idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE` 52428a0b0e6bSVictor Minden 52438a0b0e6bSVictor Minden Output Parameter: 52448a0b0e6bSVictor Minden . 
mat - the matrix 52458a0b0e6bSVictor Minden 52468a0b0e6bSVictor Minden Level: intermediate 52478a0b0e6bSVictor Minden 5248f62e3866SBarry Smith Example: 5249f62e3866SBarry Smith For the following matrix, the input data expected is as shown (using 0 based indexing) 52509e99939fSJunchao Zhang .vb 52518a0b0e6bSVictor Minden 1 0 0 52528a0b0e6bSVictor Minden 2 0 3 52538a0b0e6bSVictor Minden 4 5 6 52548a0b0e6bSVictor Minden 52558a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 52568a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 52578a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 52589e99939fSJunchao Zhang .ve 5259fe59aa6dSJacob Faibussowitsch 52602ef1f0ffSBarry Smith Note: 5261d7547e51SJunchao Zhang Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries, 5262d7547e51SJunchao Zhang and are particularly useful in iterative applications. 52638a0b0e6bSVictor Minden 52641cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()` 52658a0b0e6bSVictor Minden @*/ 5266d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx) 5267d71ae5a4SJacob Faibussowitsch { 5268d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1, row, col; 52698a0b0e6bSVictor Minden 52708a0b0e6bSVictor Minden PetscFunctionBegin; 52719566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m, &nnz)); 5272ad540459SPierre Jolivet for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1; 52739566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 52749566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 52759566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQAIJ)); 52769566063dSJacob Faibussowitsch 
PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz)); 52771230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 52781230e6d1SVictor Minden if (idx) { 52791230e6d1SVictor Minden row = i[ii] - 1; 52801230e6d1SVictor Minden col = j[ii] - 1; 52811230e6d1SVictor Minden } else { 52821230e6d1SVictor Minden row = i[ii]; 52831230e6d1SVictor Minden col = j[ii]; 52848a0b0e6bSVictor Minden } 52859566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES)); 52868a0b0e6bSVictor Minden } 52879566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 52889566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 52899566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52918a0b0e6bSVictor Minden } 529236db0b34SBarry Smith 5293d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5294d71ae5a4SJacob Faibussowitsch { 5295acf2f550SJed Brown Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5296acf2f550SJed Brown 5297acf2f550SJed Brown PetscFunctionBegin; 5298acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5299acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 53002205254eSKarl Rupp 53019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 53023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5303acf2f550SJed Brown } 5304acf2f550SJed Brown 5305d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 5306d71ae5a4SJacob Faibussowitsch { 53079c8f2541SHong Zhang PetscFunctionBegin; 53089566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat)); 53093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53109c8f2541SHong Zhang } 53119c8f2541SHong Zhang 531281824310SBarry Smith /* 531353dd7562SDmitry Karpeev Permute A 
into C's *local* index space using rowemb,colemb. 531453dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 531553dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 531653dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 531753dd7562SDmitry Karpeev */ 5318d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B) 5319d71ae5a4SJacob Faibussowitsch { 532053dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 532153dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 532253dd7562SDmitry Karpeev PetscBool seqaij; 532353dd7562SDmitry Karpeev PetscInt m, n, *nz, i, j, count; 532453dd7562SDmitry Karpeev PetscScalar v; 532553dd7562SDmitry Karpeev const PetscInt *rowindices, *colindices; 532653dd7562SDmitry Karpeev 532753dd7562SDmitry Karpeev PetscFunctionBegin; 53283ba16761SJacob Faibussowitsch if (!B) PetscFunctionReturn(PETSC_SUCCESS); 532953dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 53309566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij)); 533128b400f6SJacob Faibussowitsch PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type"); 533253dd7562SDmitry Karpeev if (rowemb) { 53339566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb, &m)); 533408401ef6SPierre Jolivet PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n); 533553dd7562SDmitry Karpeev } else { 533608401ef6SPierre Jolivet PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix"); 533753dd7562SDmitry Karpeev } 533853dd7562SDmitry Karpeev if (colemb) { 53399566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb, &n)); 534008401ef6SPierre Jolivet PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n); 534153dd7562SDmitry Karpeev } else { 534208401ef6SPierre Jolivet PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix"); 534353dd7562SDmitry Karpeev } 534453dd7562SDmitry Karpeev 534553dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ *)(B->data); 534653dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 53479566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n, &nz)); 5348ad540459SPierre Jolivet for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i]; 53499566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C, 0, nz)); 53509566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 535153dd7562SDmitry Karpeev } 535248a46eb9SPierre Jolivet if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C)); 535353dd7562SDmitry Karpeev count = 0; 535453dd7562SDmitry Karpeev rowindices = NULL; 
535553dd7562SDmitry Karpeev colindices = NULL; 535648a46eb9SPierre Jolivet if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices)); 535748a46eb9SPierre Jolivet if (colemb) PetscCall(ISGetIndices(colemb, &colindices)); 535853dd7562SDmitry Karpeev for (i = 0; i < B->rmap->n; i++) { 535953dd7562SDmitry Karpeev PetscInt row; 536053dd7562SDmitry Karpeev row = i; 536153dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 536253dd7562SDmitry Karpeev for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) { 536353dd7562SDmitry Karpeev PetscInt col; 536453dd7562SDmitry Karpeev col = Baij->j[count]; 536553dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 536653dd7562SDmitry Karpeev v = Baij->a[count]; 53679566063dSJacob Faibussowitsch PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES)); 536853dd7562SDmitry Karpeev ++count; 536953dd7562SDmitry Karpeev } 537053dd7562SDmitry Karpeev } 537153dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 537253dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 537353dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 537453dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 537553dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 53763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 537753dd7562SDmitry Karpeev } 537853dd7562SDmitry Karpeev 537958c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep) 5380dec0b466SHong Zhang { 5381dec0b466SHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 5382dec0b466SHong Zhang MatScalar *aa = a->a; 5383dec0b466SHong Zhang PetscInt m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k; 5384dec0b466SHong Zhang PetscInt *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0; 5385dec0b466SHong Zhang 5386dec0b466SHong Zhang PetscFunctionBegin; 5387dec0b466SHong Zhang PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 5388dec0b466SHong Zhang if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 5389dec0b466SHong Zhang for (i = 1; i <= m; i++) { 5390dec0b466SHong Zhang /* move each nonzero entry back by the amount of zero slots (fshift) before it*/ 5391dec0b466SHong Zhang for (k = ai[i - 1]; k < ai[i]; k++) { 539258c11ad4SPierre Jolivet if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++; 5393dec0b466SHong Zhang else { 5394dec0b466SHong Zhang if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1)); 5395dec0b466SHong Zhang aa[k - fshift] = aa[k]; 5396dec0b466SHong Zhang aj[k - fshift] = aj[k]; 5397dec0b466SHong Zhang } 5398dec0b466SHong Zhang } 5399dec0b466SHong Zhang ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration 5400dec0b466SHong Zhang fshift_prev = fshift; 5401dec0b466SHong Zhang /* reset ilen and imax for each row */ 5402dec0b466SHong Zhang ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 5403dec0b466SHong Zhang a->nonzerorowcnt += 
((ai[i] - fshift - ai[i - 1]) > 0); 5404dec0b466SHong Zhang rmax = PetscMax(rmax, ailen[i - 1]); 5405dec0b466SHong Zhang } 5406312eded4SPierre Jolivet if (fshift) { 5407dec0b466SHong Zhang if (m) { 5408dec0b466SHong Zhang ai[m] -= fshift; 5409dec0b466SHong Zhang a->nz = ai[m]; 5410dec0b466SHong Zhang } 5411dec0b466SHong Zhang PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 5412312eded4SPierre Jolivet A->nonzerostate++; 5413dec0b466SHong Zhang A->info.nz_unneeded += (PetscReal)fshift; 5414dec0b466SHong Zhang a->rmax = rmax; 5415dec0b466SHong Zhang if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A)); 5416dec0b466SHong Zhang PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 5417dec0b466SHong Zhang PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 5418312eded4SPierre Jolivet } 54193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 5420dec0b466SHong Zhang } 5421dec0b466SHong Zhang 54224099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 54234099cc6bSBarry Smith 54244099cc6bSBarry Smith /*@C 542511a5261eSBarry Smith MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype 54264099cc6bSBarry Smith 5427c3339decSBarry Smith Collective 54284099cc6bSBarry Smith 54294099cc6bSBarry Smith Input Parameters: 54304099cc6bSBarry Smith + mat - the matrix object 54314099cc6bSBarry Smith - matype - matrix type 54324099cc6bSBarry Smith 54334099cc6bSBarry Smith Options Database Key: 54344e187271SRichard Tran Mills . 
-mat_seqaij_type <method> - for example seqaijcrl 54354099cc6bSBarry Smith 54364099cc6bSBarry Smith Level: intermediate 54374099cc6bSBarry Smith 5438fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType` 54394099cc6bSBarry Smith @*/ 5440d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 5441d71ae5a4SJacob Faibussowitsch { 54424099cc6bSBarry Smith PetscBool sametype; 54435f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *); 54444099cc6bSBarry Smith 54454099cc6bSBarry Smith PetscFunctionBegin; 54464099cc6bSBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 54479566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype)); 54483ba16761SJacob Faibussowitsch if (sametype) PetscFunctionReturn(PETSC_SUCCESS); 54494099cc6bSBarry Smith 54509566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r)); 54516adde796SStefano Zampini PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype); 54529566063dSJacob Faibussowitsch PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat)); 54533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54544099cc6bSBarry Smith } 54554099cc6bSBarry Smith 54564099cc6bSBarry Smith /*@C 545711a5261eSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices 54584099cc6bSBarry Smith 54594099cc6bSBarry Smith Not Collective 54604099cc6bSBarry Smith 54614099cc6bSBarry Smith Input Parameters: 5462fe59aa6dSJacob Faibussowitsch + sname - name of a new user-defined matrix type, for example `MATSEQAIJCRL` 54634099cc6bSBarry Smith - function - routine to convert to subtype 54644099cc6bSBarry Smith 54652ef1f0ffSBarry Smith Level: advanced 54662ef1f0ffSBarry Smith 54674099cc6bSBarry Smith Notes: 546811a5261eSBarry Smith `MatSeqAIJRegister()` may be 
called multiple times to add several user-defined solvers. 54694099cc6bSBarry Smith 54704099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 54714099cc6bSBarry Smith $ -mat_seqaij_type my_mat 54724099cc6bSBarry Smith 54731cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()` 54744099cc6bSBarry Smith @*/ 5475d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *)) 5476d71ae5a4SJacob Faibussowitsch { 54774099cc6bSBarry Smith PetscFunctionBegin; 54789566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 54799566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function)); 54803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54814099cc6bSBarry Smith } 54824099cc6bSBarry Smith 54834099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 54844099cc6bSBarry Smith 54854099cc6bSBarry Smith /*@C 548611a5261eSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ` 54874099cc6bSBarry Smith 54884099cc6bSBarry Smith Not Collective 54894099cc6bSBarry Smith 54904099cc6bSBarry Smith Level: advanced 54914099cc6bSBarry Smith 54922ef1f0ffSBarry Smith Note: 54932ef1f0ffSBarry Smith This registers the versions of `MATSEQAIJ` for GPUs 54942ef1f0ffSBarry Smith 54951cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()` 54964099cc6bSBarry Smith @*/ 5497d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void) 5498d71ae5a4SJacob Faibussowitsch { 54994099cc6bSBarry Smith PetscFunctionBegin; 55003ba16761SJacob Faibussowitsch if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS); 55014099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 55024099cc6bSBarry Smith 55039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, 
MatConvert_SeqAIJ_SeqAIJCRL)); 55049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 55059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 55069779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 55079566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5508485f9817SRichard Tran Mills #endif 55095063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 55109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 55115063d097SStefano Zampini #endif 5512d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP) 5513d5e393b6SSuyash Tandon PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE)); 5514d5e393b6SSuyash Tandon #endif 55155063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 55169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 55175063d097SStefano Zampini #endif 55184099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 55199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 55204099cc6bSBarry Smith #endif 55213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55224099cc6bSBarry Smith } 552353dd7562SDmitry Karpeev 552453dd7562SDmitry Karpeev /* 552581824310SBarry Smith Special version for direct calls from Fortran 552681824310SBarry Smith */ 5527af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 552881824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 552981824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ 553081824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 553181824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 553281824310SBarry Smith #endif 553381824310SBarry Smith 
553481824310SBarry Smith /* Change these macros so can be used in void function */ 553598921bdaSJacob Faibussowitsch 553698921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 55379566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 55389566063dSJacob Faibussowitsch #undef PetscCall 55399371c9d4SSatish Balay #define PetscCall(...) \ 55409371c9d4SSatish Balay do { \ 55415f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 554298921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 554398921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \ 554498921bdaSJacob Faibussowitsch return; \ 554598921bdaSJacob Faibussowitsch } \ 554698921bdaSJacob Faibussowitsch } while (0) 554798921bdaSJacob Faibussowitsch 554898921bdaSJacob Faibussowitsch #undef SETERRQ 55499371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) 
\ 55509371c9d4SSatish Balay do { \ 555198921bdaSJacob Faibussowitsch *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \ 555298921bdaSJacob Faibussowitsch return; \ 555398921bdaSJacob Faibussowitsch } while (0) 555481824310SBarry Smith 5555d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr) 5556d71ae5a4SJacob Faibussowitsch { 555781824310SBarry Smith Mat A = *AA; 555881824310SBarry Smith PetscInt m = *mm, n = *nn; 555981824310SBarry Smith InsertMode is = *isis; 556081824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data; 556181824310SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N; 556281824310SBarry Smith PetscInt *imax, *ai, *ailen; 556381824310SBarry Smith PetscInt *aj, nonew = a->nonew, lastcol = -1; 556454f21887SBarry Smith MatScalar *ap, value, *aa; 5565ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5566ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 556781824310SBarry Smith 556881824310SBarry Smith PetscFunctionBegin; 55694994cf47SJed Brown MatCheckPreallocated(A, 1); 557081824310SBarry Smith imax = a->imax; 557181824310SBarry Smith ai = a->i; 557281824310SBarry Smith ailen = a->ilen; 557381824310SBarry Smith aj = a->j; 557481824310SBarry Smith aa = a->a; 557581824310SBarry Smith 557681824310SBarry Smith for (k = 0; k < m; k++) { /* loop over added rows */ 557781824310SBarry Smith row = im[k]; 557881824310SBarry Smith if (row < 0) continue; 55795f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large"); 55809371c9d4SSatish Balay rp = aj + ai[row]; 55819371c9d4SSatish Balay ap = aa + ai[row]; 55829371c9d4SSatish Balay rmax = imax[row]; 55839371c9d4SSatish Balay nrow = ailen[row]; 558481824310SBarry 
Smith low = 0; 558581824310SBarry Smith high = nrow; 558681824310SBarry Smith for (l = 0; l < n; l++) { /* loop over added columns */ 558781824310SBarry Smith if (in[l] < 0) continue; 55885f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large"); 558981824310SBarry Smith col = in[l]; 55902205254eSKarl Rupp if (roworiented) value = v[l + k * n]; 55912205254eSKarl Rupp else value = v[k + l * m]; 55922205254eSKarl Rupp 559381824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 559481824310SBarry Smith 55952205254eSKarl Rupp if (col <= lastcol) low = 0; 55962205254eSKarl Rupp else high = nrow; 559781824310SBarry Smith lastcol = col; 559881824310SBarry Smith while (high - low > 5) { 559981824310SBarry Smith t = (low + high) / 2; 560081824310SBarry Smith if (rp[t] > col) high = t; 560181824310SBarry Smith else low = t; 560281824310SBarry Smith } 560381824310SBarry Smith for (i = low; i < high; i++) { 560481824310SBarry Smith if (rp[i] > col) break; 560581824310SBarry Smith if (rp[i] == col) { 560681824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 560781824310SBarry Smith else ap[i] = value; 560881824310SBarry Smith goto noinsert; 560981824310SBarry Smith } 561081824310SBarry Smith } 561181824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 561281824310SBarry Smith if (nonew == 1) goto noinsert; 56135f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix"); 5614fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 56159371c9d4SSatish Balay N = nrow++ - 1; 56169371c9d4SSatish Balay a->nz++; 56179371c9d4SSatish Balay high++; 561881824310SBarry Smith /* shift up all the later entries in this row */ 561981824310SBarry Smith for (ii = N; ii >= i; ii--) { 
562081824310SBarry Smith rp[ii + 1] = rp[ii]; 562181824310SBarry Smith ap[ii + 1] = ap[ii]; 562281824310SBarry Smith } 562381824310SBarry Smith rp[i] = col; 562481824310SBarry Smith ap[i] = value; 5625e56f5c9eSBarry Smith A->nonzerostate++; 562681824310SBarry Smith noinsert:; 562781824310SBarry Smith low = i + 1; 562881824310SBarry Smith } 562981824310SBarry Smith ailen[row] = nrow; 563081824310SBarry Smith } 563181824310SBarry Smith PetscFunctionReturnVoid(); 563281824310SBarry Smith } 563398921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 563498921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 563598921bdaSJacob Faibussowitsch * original definitions */ 56369566063dSJacob Faibussowitsch #undef PetscCall 563798921bdaSJacob Faibussowitsch #undef SETERRQ 5638